Repository: morloc-project/morloc Branch: master Commit: cc330baae2e1 Files: 2281 Total size: 3.9 MB Directory structure: gitextract_3x8i50ut/ ├── .dockerignore ├── .github/ │ └── workflows/ │ ├── release.yml │ └── test.yml ├── .gitignore ├── ChangeLog.md ├── LICENSE ├── README.md ├── bench/ │ ├── Bench.hs │ └── test-data/ │ ├── complex-types.loc │ ├── interop.loc │ └── simple.loc ├── container/ │ ├── Makefile │ ├── full/ │ │ ├── Dockerfile │ │ └── assets/ │ │ ├── README │ │ ├── bashrc │ │ └── vimrc │ ├── static-build/ │ │ ├── Dockerfile │ │ └── build.sh │ ├── test/ │ │ ├── Dockerfile │ │ └── assets/ │ │ └── bashrc │ └── tiny/ │ └── Dockerfile ├── data/ │ ├── lang/ │ │ ├── c/ │ │ │ └── lang.yaml │ │ ├── cpp/ │ │ │ ├── cppmorloc.cpp │ │ │ ├── cppmorloc.hpp │ │ │ ├── init.sh │ │ │ ├── lang.yaml │ │ │ ├── mlc_arrow.hpp │ │ │ ├── mlc_tensor.hpp │ │ │ ├── morloc_pch.hpp │ │ │ ├── nanoarrow/ │ │ │ │ ├── nanoarrow.c │ │ │ │ └── nanoarrow.h │ │ │ └── pool.cpp │ │ ├── julia/ │ │ │ ├── MorlocRuntime.jl │ │ │ ├── init.sh │ │ │ ├── juliabridge.c │ │ │ ├── lang.yaml │ │ │ └── pool.jl │ │ ├── languages.yaml │ │ ├── py/ │ │ │ ├── Makefile │ │ │ ├── init.sh │ │ │ ├── lang.yaml │ │ │ ├── pool.py │ │ │ ├── pymorloc.c │ │ │ └── setup.py │ │ └── r/ │ │ ├── init.sh │ │ ├── lang.yaml │ │ ├── pool.R │ │ └── rmorloc.c │ ├── misc/ │ │ └── mlccpptypes.hpp │ ├── morloc/ │ │ └── morloc.h │ └── rust/ │ ├── .gitignore │ ├── Cargo.toml │ ├── morloc-manager/ │ │ ├── Cargo.toml │ │ └── src/ │ │ ├── config.rs │ │ ├── container.rs │ │ ├── doctor.rs │ │ ├── environment.rs │ │ ├── error.rs │ │ ├── freeze.rs │ │ ├── main.rs │ │ ├── selinux.rs │ │ ├── serve.rs │ │ └── types.rs │ ├── morloc-manifest/ │ │ ├── Cargo.toml │ │ └── src/ │ │ └── lib.rs │ ├── morloc-nexus/ │ │ ├── Cargo.toml │ │ ├── build.rs │ │ └── src/ │ │ ├── dispatch.rs │ │ ├── help.rs │ │ ├── main.rs │ │ ├── manifest.rs │ │ └── process.rs │ └── morloc-runtime/ │ ├── Cargo.toml │ ├── build.rs │ ├── cbindgen.toml │ └── src/ │ ├── 
arrow_ffi.rs │ ├── cache.rs │ ├── cli.rs │ ├── cschema.rs │ ├── daemon_ffi.rs │ ├── error.rs │ ├── eval_ffi.rs │ ├── ffi.rs │ ├── hash.rs │ ├── http_ffi.rs │ ├── intrinsics.rs │ ├── ipc.rs │ ├── ipc_ffi.rs │ ├── json.rs │ ├── json_ffi.rs │ ├── lib.rs │ ├── manifest_ffi.rs │ ├── mpack.rs │ ├── packet.rs │ ├── packet_ffi.rs │ ├── pool_ffi.rs │ ├── router_ffi.rs │ ├── schema.rs │ ├── shm.rs │ ├── slurm_ffi.rs │ ├── utility.rs │ └── voidstar.rs ├── exe/ │ └── morloc-codegen-generic/ │ └── Main.hs ├── executable/ │ ├── CppPrinter.hs │ ├── CppTranslator.hs │ ├── Main.hs │ ├── Subcommands.hs │ └── UI.hs ├── fourmolu.yaml ├── hie.yaml ├── library/ │ ├── Morloc/ │ │ ├── BaseTypes.hs │ │ ├── CodeGenerator/ │ │ │ ├── Docstrings.hs │ │ │ ├── Emit.hs │ │ │ ├── Express.hs │ │ │ ├── Grammars/ │ │ │ │ ├── Common.hs │ │ │ │ ├── Macro.hs │ │ │ │ └── Translator/ │ │ │ │ ├── Generic.hs │ │ │ │ ├── Imperative.hs │ │ │ │ └── PseudoCode.hs │ │ │ ├── Infer.hs │ │ │ ├── LambdaEval.hs │ │ │ ├── LanguageDescriptor.hs │ │ │ ├── Namespace.hs │ │ │ ├── Nexus.hs │ │ │ ├── Parameterize.hs │ │ │ ├── Realize.hs │ │ │ ├── Reduce.hs │ │ │ ├── Segment.hs │ │ │ ├── Serial.hs │ │ │ ├── Serialize.hs │ │ │ └── SystemConfig.hs │ │ ├── Completion.hs │ │ ├── Config.hs │ │ ├── Data/ │ │ │ ├── Annotated.hs │ │ │ ├── Bifoldable.hs │ │ │ ├── Bifunctor.hs │ │ │ ├── DAG.hs │ │ │ ├── Doc.hs │ │ │ ├── GMap.hs │ │ │ ├── Json.hs │ │ │ ├── Map/ │ │ │ │ └── Extra.hs │ │ │ ├── Map.hs │ │ │ └── Text.hs │ │ ├── DataFiles.hs │ │ ├── Frontend/ │ │ │ ├── API.hs │ │ │ ├── AST.hs │ │ │ ├── CST.hs │ │ │ ├── Desugar.hs │ │ │ ├── Lexer.hs │ │ │ ├── Link.hs │ │ │ ├── Merge.hs │ │ │ ├── Namespace.hs │ │ │ ├── Parser.hs │ │ │ ├── Parser.y │ │ │ ├── Restructure.hs │ │ │ ├── Token.hs │ │ │ ├── Treeify.hs │ │ │ ├── Typecheck.hs │ │ │ └── Valuecheck.hs │ │ ├── Internal.hs │ │ ├── LangRegistry.hs │ │ ├── Language.hs │ │ ├── Module.hs │ │ ├── Monad.hs │ │ ├── Namespace/ │ │ │ ├── Expr.hs │ │ │ ├── Prim.hs │ │ │ ├── State.hs │ │ │ └── 
Type.hs │ │ ├── ProgramBuilder/ │ │ │ ├── Build.hs │ │ │ └── Install.hs │ │ ├── Quasi.hs │ │ ├── System.hs │ │ ├── TypeEval.hs │ │ ├── Typecheck/ │ │ │ ├── Internal.hs │ │ │ └── NatSolver.hs │ │ └── Version.hs │ └── Morloc.hs ├── metrics/ │ ├── README.md │ └── scripts/ │ ├── collect-metrics.sh │ └── compare-metrics.sh ├── package.yaml ├── scripts/ │ ├── build-rust.sh │ └── bump-version.sh ├── spec/ │ ├── SPEC.md │ ├── compiler/ │ │ ├── COMPILER.md │ │ ├── build.md │ │ ├── codegen.md │ │ ├── parsing.md │ │ ├── pipeline.md │ │ └── typechecking.md │ ├── interop/ │ │ ├── INTEROP.md │ │ ├── foreign-functions.md │ │ ├── implementation-selection.md │ │ ├── serialization.md │ │ └── type-mappings.md │ ├── language/ │ │ ├── LANGUAGE.md │ │ ├── annotations.md │ │ ├── declarations.md │ │ ├── expressions.md │ │ ├── lexical-structure.md │ │ └── operators.md │ ├── modules/ │ │ ├── MODULES.md │ │ ├── imports-and-exports.md │ │ ├── packages.md │ │ └── resolution.md │ ├── runtime/ │ │ ├── RUNTIME.md │ │ ├── cli.md │ │ ├── execution-model.md │ │ ├── ipc.md │ │ └── manifest.md │ └── types/ │ ├── TYPES.md │ ├── inference.md │ ├── polymorphism.md │ ├── primitive-types.md │ ├── records.md │ ├── subtyping.md │ ├── type-declarations.md │ └── typeclasses.md ├── stack.yaml └── test-suite/ ├── .gitignore ├── GoldenMakefileTests.hs ├── Main.hs ├── PropertyTests.hs ├── UnitTypeTests.hs ├── cmorloc-tests/ │ ├── Makefile │ ├── test.c │ └── test.h ├── concurrency-tests/ │ ├── bidi-py-r.loc │ ├── bidi-r-py.loc │ ├── concurrent-uni.loc │ ├── deep-callback.loc │ ├── helpers/ │ │ ├── py_funcs.py │ │ └── r_funcs.R │ └── run-tests.sh ├── daemon-tests/ │ ├── arithmetic.loc │ ├── helpers.py │ ├── pure.loc │ ├── run-tests.sh │ └── strings.loc ├── error-message-tests/ │ ├── README │ ├── bad-source/ │ │ ├── Makefile │ │ └── foo.loc │ ├── cyclical-import/ │ │ └── foo.loc │ ├── list-error-1/ │ │ ├── Makefile │ │ └── foo.loc │ ├── missing-import-module/ │ │ └── foo.loc │ ├── missing-import-term/ │ │ ├── 
barm.loc │ │ └── main.loc │ ├── pool-crash-cpp/ │ │ ├── Makefile │ │ ├── foo.hpp │ │ ├── main │ │ └── main.loc │ ├── runtime-error-cpp/ │ │ ├── Makefile │ │ ├── foo.hpp │ │ └── main.loc │ ├── runtime-error-cross-lang/ │ │ ├── Makefile │ │ ├── foo.R │ │ ├── foo.hpp │ │ ├── foo.py │ │ └── main.loc │ ├── runtime-error-py/ │ │ ├── Makefile │ │ ├── foo.py │ │ └── main.loc │ ├── runtime-error-r/ │ │ ├── Makefile │ │ ├── foo.R │ │ └── main.loc │ ├── term-masking/ │ │ ├── foo.loc │ │ ├── foo2.loc │ │ └── foo3.loc │ ├── typechecking-1/ │ │ ├── Makefile │ │ └── foo.loc │ ├── typechecking-2/ │ │ ├── Makefile │ │ └── foo.loc │ ├── typeclass-bad-instance/ │ │ └── foo.loc │ ├── typeclass-bad-instance-expr/ │ │ └── foo.loc │ ├── typeclass-masking/ │ │ ├── foo.loc │ │ ├── foo2.loc │ │ └── foo3.loc │ ├── typeclass-monomorphic-conflict/ │ │ ├── foo.loc │ │ ├── foo2.loc │ │ └── foo3.loc │ ├── typeclass-overlap/ │ │ ├── foo.loc │ │ ├── foo2.loc │ │ └── foo3.loc │ └── undefined-term/ │ ├── Makefile │ └── foo.loc ├── executable-benchmark/ │ ├── .gitignore │ ├── README │ ├── distributed/ │ │ ├── .gitignore │ │ ├── Makefile │ │ ├── foo.cpp │ │ ├── foo.py │ │ ├── main.loc │ │ └── main.yaml │ ├── parallel-interop/ │ │ ├── .gitignore │ │ ├── Makefile │ │ ├── foo.R │ │ ├── foo.loc │ │ ├── foo.py │ │ ├── parallel.py │ │ └── test.sh │ └── serial-interop/ │ ├── .gitignore │ ├── Makefile │ ├── foo.R │ ├── foo.hpp │ ├── foo.loc │ ├── foo.py │ ├── long-list.json │ ├── medium-list.json │ └── test.sh ├── golden-tests/ │ ├── .gitignore │ ├── README.md │ ├── alias-array-monoid/ │ │ ├── Makefile │ │ ├── exp.txt │ │ └── main.loc │ ├── alias-concrete-bugs/ │ │ ├── Makefile │ │ ├── exp.txt │ │ └── main.loc │ ├── alias-constructor-equiv/ │ │ ├── Makefile │ │ ├── exp.txt │ │ └── main.loc │ ├── alias-dedup-1/ │ │ ├── Makefile │ │ ├── exp.txt │ │ └── main.loc │ ├── alias-no-cross-instance/ │ │ ├── Makefile │ │ ├── exp.txt │ │ └── main.loc │ ├── argument-form-1-c/ │ │ ├── Makefile │ │ ├── exp.txt │ │ └── 
main.loc │ ├── argument-form-1-py/ │ │ ├── Makefile │ │ ├── exp.txt │ │ └── main.loc │ ├── argument-form-1-r/ │ │ ├── Makefile │ │ ├── exp.txt │ │ └── main.loc │ ├── argument-form-2-c/ │ │ ├── Makefile │ │ ├── exp.txt │ │ └── main.loc │ ├── argument-form-2-py/ │ │ ├── Makefile │ │ ├── exp.txt │ │ └── main.loc │ ├── argument-form-2-r/ │ │ ├── Makefile │ │ ├── exp.txt │ │ └── main.loc │ ├── argument-form-3-c/ │ │ ├── Makefile │ │ ├── exp.txt │ │ └── main.loc │ ├── argument-form-3-py/ │ │ ├── Makefile │ │ ├── exp.txt │ │ └── main.loc │ ├── argument-form-3-r/ │ │ ├── Makefile │ │ ├── exp.txt │ │ └── main.loc │ ├── argument-form-4-c/ │ │ ├── Makefile │ │ ├── exp.txt │ │ └── main.loc │ ├── argument-form-4-py/ │ │ ├── Makefile │ │ ├── exp.txt │ │ └── main.loc │ ├── argument-form-4-r/ │ │ ├── Makefile │ │ ├── exp.txt │ │ └── main.loc │ ├── argument-form-5-c/ │ │ ├── Makefile │ │ ├── exp.txt │ │ └── main.loc │ ├── argument-form-5-py/ │ │ ├── Makefile │ │ ├── exp.txt │ │ └── main.loc │ ├── argument-form-5-r/ │ │ ├── Makefile │ │ ├── exp.txt │ │ └── main.loc │ ├── argument-form-6-c/ │ │ ├── Makefile │ │ ├── exp.txt │ │ └── main.loc │ ├── argument-form-6-py/ │ │ ├── Makefile │ │ ├── exp.txt │ │ └── main.loc │ ├── argument-form-6-r/ │ │ ├── Makefile │ │ ├── exp.txt │ │ └── main.loc │ ├── argument-form-7-c/ │ │ ├── Makefile │ │ ├── exp.txt │ │ └── main.loc │ ├── argument-form-7-py/ │ │ ├── Makefile │ │ ├── exp.txt │ │ └── main.loc │ ├── argument-form-7-r/ │ │ ├── Makefile │ │ ├── exp.txt │ │ └── main.loc │ ├── argument-form-8-c/ │ │ ├── Makefile │ │ ├── exp.txt │ │ └── main.loc │ ├── argument-form-8-py/ │ │ ├── Makefile │ │ ├── exp.txt │ │ └── main.loc │ ├── argument-form-8-r/ │ │ ├── Makefile │ │ ├── exp.txt │ │ └── main.loc │ ├── arrow-immutable-cp/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── main.loc │ │ ├── src.hpp │ │ └── src.py │ ├── arrow-immutable-pc/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── main.loc │ │ ├── src.hpp │ │ └── src.py │ ├── arrow-immutable-pr/ │ │ ├── Makefile 
│ │ ├── exp.txt │ │ ├── main.loc │ │ ├── src.R │ │ └── src.py │ ├── arrow-immutable-rp/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── main.loc │ │ ├── src.R │ │ └── src.py │ ├── arrow-nexus-cpp/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── main.loc │ │ └── src.hpp │ ├── arrow-nexus-py/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── main.loc │ │ └── src.py │ ├── bare-selector-args/ │ │ ├── Makefile │ │ ├── exp.txt │ │ └── main.loc │ ├── bare-selector-chain/ │ │ ├── Makefile │ │ ├── exp.txt │ │ └── main.loc │ ├── bug-intrinsic-schema-crash/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── helper.py │ │ └── main.loc │ ├── bug-load-type-infer/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── helper.py │ │ └── main.loc │ ├── claude-test-1/ │ │ ├── Makefile │ │ ├── exp.txt │ │ └── main.loc │ ├── claude-test-10/ │ │ ├── Makefile │ │ ├── README.md │ │ ├── exp.txt │ │ ├── main.loc │ │ ├── sequence_align.hpp │ │ ├── sequence_io.py │ │ └── sequence_stats.R │ ├── claude-test-11/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── main.loc │ │ ├── sysinfo.R │ │ ├── sysinfo.hpp │ │ └── sysinfo.py │ ├── claude-test-12/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── helper.py │ │ └── main.loc │ ├── claude-test-13/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── main.loc │ │ ├── stress.hpp │ │ └── stress.py │ ├── claude-test-14/ │ │ ├── Makefile │ │ ├── edge.hpp │ │ ├── edge.py │ │ ├── exp.txt │ │ └── main.loc │ ├── claude-test-15/ │ │ ├── Makefile │ │ ├── bigdata.hpp │ │ ├── bigdata.py │ │ ├── exp.txt │ │ └── main.loc │ ├── claude-test-16/ │ │ ├── Makefile │ │ ├── cstress.hpp │ │ ├── exp.txt │ │ ├── main.loc │ │ └── pstress.py │ ├── claude-test-17/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── helper.py │ │ └── main.loc │ ├── claude-test-18/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── helper.py │ │ └── main.loc │ ├── claude-test-19/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── helper.py │ │ └── main.loc │ ├── claude-test-2/ │ │ ├── Makefile │ │ ├── exp.txt │ │ └── main.loc │ ├── claude-test-20/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── helper.py │ 
│ └── main.loc │ ├── claude-test-3/ │ │ ├── Makefile │ │ ├── exp.txt │ │ └── main.loc │ ├── claude-test-4/ │ │ ├── Makefile │ │ ├── exp.txt │ │ └── main.loc │ ├── claude-test-5/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── game.hpp │ │ ├── game.py │ │ ├── main.loc │ │ └── package.yaml │ ├── claude-test-6/ │ │ ├── Makefile │ │ ├── README.md │ │ ├── exp.txt │ │ ├── filters.hpp │ │ ├── image_io.py │ │ ├── main.loc │ │ └── stats.R │ ├── claude-test-7/ │ │ ├── Makefile │ │ ├── README.md │ │ ├── aggregations.hpp │ │ ├── data_io.py │ │ ├── exp.txt │ │ ├── main.loc │ │ └── statistics.R │ ├── claude-test-8/ │ │ ├── Makefile │ │ ├── README.md │ │ ├── exp.txt │ │ ├── main.loc │ │ ├── string_ops.hpp │ │ ├── text_processing.py │ │ └── text_stats.R │ ├── claude-test-9/ │ │ ├── Makefile │ │ ├── README.md │ │ ├── exp.txt │ │ ├── finance_stats.R │ │ ├── helpers.py │ │ ├── main.loc │ │ ├── market_io.py │ │ ├── monte_carlo.hpp │ │ └── test-map.loc │ ├── command-groups/ │ │ ├── Makefile │ │ ├── exp.txt │ │ └── main.loc │ ├── composition/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── main.loc │ │ └── paste.py │ ├── demo-trimming/ │ │ ├── .gitignore │ │ ├── Makefile │ │ ├── config.json │ │ ├── example.fastq │ │ ├── exp.txt │ │ ├── foo.hpp │ │ └── main.loc │ ├── edge-cases-1/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── foo.py │ │ └── main.loc │ ├── edge-cases-2/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── foo.R │ │ ├── foo.py │ │ └── main.loc │ ├── effect-accumulate-py/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── foo.py │ │ └── main.loc │ ├── effect-coerce-cpp/ │ │ ├── Makefile │ │ ├── exp.txt │ │ └── main.loc │ ├── effect-coerce-py/ │ │ ├── Makefile │ │ ├── exp.txt │ │ └── main.loc │ ├── effect-error-cpp/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── foo.hpp │ │ └── main.loc │ ├── effect-multi-label-py/ │ │ ├── Makefile │ │ ├── exp.txt │ │ └── main.loc │ ├── effect-subtype-py/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── foo.py │ │ └── main.loc │ ├── errors/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── foo.R │ │ ├── 
foo.hpp │ │ ├── foo.py │ │ └── main.loc │ ├── eta-reduction-1/ │ │ ├── Makefile │ │ ├── exp.txt │ │ └── main.loc │ ├── eta-reduction-2/ │ │ ├── Makefile │ │ ├── exp.txt │ │ └── main.loc │ ├── eta-reduction-3/ │ │ ├── Makefile │ │ ├── exp.txt │ │ └── main.loc │ ├── eta-reduction-4/ │ │ ├── Makefile │ │ ├── exp.txt │ │ └── main.loc │ ├── eta-reduction-5/ │ │ ├── Makefile │ │ ├── exp.txt │ │ └── main.loc │ ├── eta-reduction-6/ │ │ ├── Makefile │ │ ├── exp.txt │ │ └── main.loc │ ├── eta-reduction-7/ │ │ ├── Makefile │ │ ├── exp.txt │ │ └── main.loc │ ├── eta-reduction-8-cpp/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── foo.hpp │ │ └── main.loc │ ├── eta-reduction-8-py/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── foo.py │ │ └── main.loc │ ├── eval-restrict-source/ │ │ ├── Makefile │ │ └── exp.txt │ ├── feature-integration-1/ │ │ ├── Makefile │ │ ├── exp.txt │ │ └── main.loc │ ├── file-input-c/ │ │ ├── .gitignore │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── foo.hpp │ │ ├── main.loc │ │ └── run.sh │ ├── file-input-py/ │ │ ├── .gitignore │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── foo.py │ │ ├── main.loc │ │ └── run.sh │ ├── file-input-r/ │ │ ├── .gitignore │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── foo.R │ │ ├── main.loc │ │ └── run.sh │ ├── force-inline-basic/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── foo.hpp │ │ └── main.loc │ ├── formatting/ │ │ ├── .gitignore │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── foo.py │ │ └── main.loc │ ├── functional-data-1/ │ │ ├── Makefile │ │ ├── bar.py │ │ ├── exp.txt │ │ ├── foo.hpp │ │ └── main.loc │ ├── functional-data-2/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── foo.py │ │ └── main.loc │ ├── functional-data-3a/ │ │ ├── Makefile │ │ ├── exp.txt │ │ └── main.loc │ ├── functional-data-3b/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── main.hpp │ │ ├── main.loc │ │ └── main.py │ ├── functional-data-3c/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── main.loc │ │ └── main.py │ ├── functional-data-3d/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── main.loc │ │ └── main.py │ ├── 
functional-data-3d-c/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── main.hpp │ │ └── main.loc │ ├── functional-data-3d-py/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── main.loc │ │ └── main.py │ ├── functional-data-3d-r/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── main.R │ │ └── main.loc │ ├── functional-data-3e/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── main.loc │ │ └── main.py │ ├── functional-data-3f/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── main.loc │ │ └── main.py │ ├── functional-data-4/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── main.loc │ │ └── main.py │ ├── functional-data-5/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── main.loc │ │ └── main.py │ ├── generic-hofs-1/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── foo.hpp │ │ └── main.loc │ ├── generic-hofs-2/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── foo.hpp │ │ └── main.loc │ ├── guards-cpp/ │ │ ├── Makefile │ │ ├── exp.txt │ │ └── main.loc │ ├── guards-inline-cpp/ │ │ ├── Makefile │ │ ├── exp.txt │ │ └── main.loc │ ├── guards-let-cpp/ │ │ ├── Makefile │ │ ├── exp.txt │ │ └── main.loc │ ├── guards-let-py/ │ │ ├── Makefile │ │ ├── exp.txt │ │ └── main.loc │ ├── guards-let-r/ │ │ ├── Makefile │ │ ├── exp.txt │ │ └── main.loc │ ├── guards-py/ │ │ ├── Makefile │ │ ├── exp.txt │ │ └── main.loc │ ├── guards-r/ │ │ ├── Makefile │ │ ├── exp.txt │ │ └── main.loc │ ├── higher-kinded-types/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── foo.py │ │ ├── main.loc │ │ └── notes │ ├── hofs-1/ │ │ ├── Makefile │ │ ├── eq.py │ │ ├── exp.txt │ │ ├── foo.R │ │ ├── foo.hpp │ │ ├── foo.loc │ │ ├── foo.py │ │ ├── fooc.loc │ │ ├── foopy.loc │ │ ├── foor.loc │ │ └── main.loc │ ├── holes-func/ │ │ ├── Makefile │ │ ├── exp.txt │ │ └── main.loc │ ├── holes-record/ │ │ ├── Makefile │ │ ├── exp.txt │ │ └── main.loc │ ├── holes-simple/ │ │ ├── Makefile │ │ ├── exp.txt │ │ └── main.loc │ ├── import-1/ │ │ ├── Makefile │ │ ├── exp.txt │ │ └── main.loc │ ├── import-2/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── localmap/ │ │ │ ├── main.loc │ │ │ └── main.py │ │ └── main.loc 
│ ├── infix/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── impl.py │ │ └── main.loc │ ├── infix-generic/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── foo.py │ │ └── main.loc │ ├── infix-import/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── foo.py │ │ ├── main.loc │ │ └── ops/ │ │ ├── main.loc │ │ └── ops.py │ ├── infix-local-fixity/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── main.loc │ │ ├── ops-a/ │ │ │ ├── main.loc │ │ │ └── ops.py │ │ └── ops-b/ │ │ ├── main.loc │ │ └── ops.py │ ├── infix-polyglot/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── main.loc │ │ ├── ops/ │ │ │ └── main.loc │ │ ├── ops-cpp/ │ │ │ ├── main.loc │ │ │ └── ops.hpp │ │ └── ops-py/ │ │ ├── main.loc │ │ └── ops.py │ ├── infix-typeclass-import/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── foo.py │ │ ├── main.loc │ │ └── numops/ │ │ ├── main.loc │ │ └── ops.py │ ├── infix-typeclass-polyglot/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── main.loc │ │ ├── semiring/ │ │ │ └── main.loc │ │ ├── semiring-cpp/ │ │ │ ├── main.loc │ │ │ └── ops.hpp │ │ └── semiring-py/ │ │ ├── main.loc │ │ └── ops.py │ ├── infix-typeclass-simple/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── foo.py │ │ └── main.loc │ ├── inline-block-py/ │ │ ├── Makefile │ │ ├── exp.txt │ │ └── main.loc │ ├── inline-cross-lang/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── foo.R │ │ ├── foo.py │ │ └── main.loc │ ├── inline-deep-py/ │ │ ├── Makefile │ │ ├── exp.txt │ │ └── main.loc │ ├── inline-func-py/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── foo.py │ │ └── main.loc │ ├── inline-ho-py/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── foo.py │ │ └── main.loc │ ├── inline-mixed-py/ │ │ ├── Makefile │ │ ├── exp.txt │ │ └── main.loc │ ├── inline-old-style-py/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── foo.py │ │ └── main.loc │ ├── inline-op-ho-py/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── foo.py │ │ └── main.loc │ ├── inline-op-py/ │ │ ├── Makefile │ │ ├── exp.txt │ │ └── main.loc │ ├── inline-typeclass-py/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── main.loc │ │ └── ops.py │ ├── interop-1-py/ 
│ │ ├── Makefile │ │ ├── exp.txt │ │ └── main.loc │ ├── interop-1-r/ │ │ ├── Makefile │ │ ├── exp.txt │ │ └── main.loc │ ├── interop-10/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── foo.hpp │ │ ├── foo.py │ │ └── main.loc │ ├── interop-11/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── incdef.hpp │ │ ├── main.loc │ │ └── pysum.py │ ├── interop-2/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── foo.R │ │ ├── foo.loc │ │ ├── foo.py │ │ ├── foopy.loc │ │ ├── foor.loc │ │ └── main.loc │ ├── interop-3a-cp/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── foo.R │ │ ├── foo.hpp │ │ ├── foo.loc │ │ ├── foo.py │ │ ├── fooc.loc │ │ ├── foopy.loc │ │ ├── foor.loc │ │ └── main.loc │ ├── interop-3a-pp/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── foo.loc │ │ ├── foo.py │ │ ├── foopy.loc │ │ └── main.loc │ ├── interop-3a-pr/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── foo.R │ │ ├── foo.loc │ │ ├── foo.py │ │ ├── foopy.loc │ │ ├── foor.loc │ │ └── main.loc │ ├── interop-3a-rc/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── foo.R │ │ ├── foo.hpp │ │ ├── foo.loc │ │ ├── foo.py │ │ ├── fooc.loc │ │ ├── foopy.loc │ │ ├── foor.loc │ │ └── main.loc │ ├── interop-3b-cp/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── foo.R │ │ ├── foo.hpp │ │ ├── foo.loc │ │ ├── foo.py │ │ ├── fooc.loc │ │ ├── foopy.loc │ │ ├── foor.loc │ │ └── main.loc │ ├── interop-3b-pp/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── foo.R │ │ ├── foo.hpp │ │ ├── foo.loc │ │ ├── foo.py │ │ ├── fooc.loc │ │ ├── foopy.loc │ │ ├── foor.loc │ │ └── main.loc │ ├── interop-3b-pr/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── foo.R │ │ ├── foo.hpp │ │ ├── foo.loc │ │ ├── foo.py │ │ ├── fooc.loc │ │ ├── foopy.loc │ │ ├── foor.loc │ │ └── main.loc │ ├── interop-3b-rc/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── foo.R │ │ ├── foo.hpp │ │ ├── foo.loc │ │ ├── foo.py │ │ ├── fooc.loc │ │ ├── foopy.loc │ │ ├── foor.loc │ │ └── main.loc │ ├── interop-3c-cp/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── foo.R │ │ ├── foo.hpp │ │ ├── foo.loc │ │ ├── foo.py │ │ ├── fooc.loc │ │ ├── foopy.loc │ │ 
├── foor.loc │ │ └── main.loc │ ├── interop-3c-pp/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── foo.R │ │ ├── foo.hpp │ │ ├── foo.loc │ │ ├── foo.py │ │ ├── fooc.loc │ │ ├── foopy.loc │ │ ├── foor.loc │ │ └── main.loc │ ├── interop-3c-pr/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── foo.R │ │ ├── foo.hpp │ │ ├── foo.loc │ │ ├── foo.py │ │ ├── fooc.loc │ │ ├── foopy.loc │ │ ├── foor.loc │ │ └── main.loc │ ├── interop-3c-rc/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── foo.R │ │ ├── foo.hpp │ │ ├── foo.loc │ │ ├── foo.py │ │ ├── fooc.loc │ │ ├── foopy.loc │ │ ├── foor.loc │ │ └── main.loc │ ├── interop-3d-cp/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── foo.R │ │ ├── foo.hpp │ │ ├── foo.loc │ │ ├── foo.py │ │ ├── fooc.loc │ │ ├── foopy.loc │ │ ├── foor.loc │ │ └── main.loc │ ├── interop-3d-pp/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── foo.R │ │ ├── foo.hpp │ │ ├── foo.loc │ │ ├── foo.py │ │ ├── fooc.loc │ │ ├── foopy.loc │ │ ├── foor.loc │ │ └── main.loc │ ├── interop-3d-pr/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── foo.R │ │ ├── foo.hpp │ │ ├── foo.loc │ │ ├── foo.py │ │ ├── fooc.loc │ │ ├── foopy.loc │ │ ├── foor.loc │ │ └── main.loc │ ├── interop-3d-rc/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── foo.R │ │ ├── foo.hpp │ │ ├── foo.loc │ │ ├── foo.py │ │ ├── fooc.loc │ │ ├── foopy.loc │ │ ├── foor.loc │ │ └── main.loc │ ├── interop-3e-cp/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── foo.R │ │ ├── foo.hpp │ │ ├── foo.loc │ │ ├── foo.py │ │ ├── fooc.loc │ │ ├── foopy.loc │ │ ├── foor.loc │ │ └── main.loc │ ├── interop-3e-pp/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── foo.R │ │ ├── foo.hpp │ │ ├── foo.loc │ │ ├── foo.py │ │ ├── fooc.loc │ │ ├── foopy.loc │ │ ├── foor.loc │ │ └── main.loc │ ├── interop-3e-pr/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── foo.R │ │ ├── foo.hpp │ │ ├── foo.loc │ │ ├── foo.py │ │ ├── fooc.loc │ │ ├── foopy.loc │ │ ├── foor.loc │ │ └── main.loc │ ├── interop-3e-rc/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── foo.R │ │ ├── foo.hpp │ │ ├── foo.loc │ │ ├── foo.py │ │ ├── 
fooc.loc │ │ ├── foopy.loc │ │ ├── foor.loc │ │ └── main.loc │ ├── interop-3f/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── foo.R │ │ ├── foo.hpp │ │ ├── foo.loc │ │ ├── foo.py │ │ ├── fooc.loc │ │ ├── foopy.loc │ │ ├── foor.loc │ │ └── main.loc │ ├── interop-4/ │ │ ├── Makefile │ │ ├── exp.txt │ │ └── main.loc │ ├── interop-5/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── foo.hpp │ │ ├── foo.loc │ │ ├── foo.py │ │ ├── fooc.loc │ │ ├── foopy.loc │ │ └── main.loc │ ├── interop-6/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── foo.R │ │ ├── foo.loc │ │ ├── foo.py │ │ ├── foopy.loc │ │ ├── foor.loc │ │ └── main.loc │ ├── interop-7/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── foo.R │ │ ├── foo.hpp │ │ └── main.loc │ ├── interop-8-py-to-r/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── foo.R │ │ ├── foo.py │ │ └── main.loc │ ├── interop-8-r-to-c/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── foo.R │ │ ├── foo.hpp │ │ └── main.loc │ ├── interop-8-r-to-py/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── foo.R │ │ ├── foo.py │ │ └── main.loc │ ├── interop-9/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── foo.R │ │ ├── foo.py │ │ └── main.loc │ ├── intrinsic-agnostic/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── hello.json │ │ └── main.loc │ ├── intrinsic-constants/ │ │ ├── .gitignore │ │ ├── Makefile │ │ ├── exp.txt │ │ └── main.loc │ ├── intrinsic-hash/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── foo.hpp │ │ ├── foo.py │ │ └── main.loc │ ├── intrinsic-show-ho-r/ │ │ ├── Makefile │ │ ├── exp.txt │ │ └── main.loc │ ├── intrinsic-show-read/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── foo.hpp │ │ └── main.loc │ ├── intrinsic-show-read-nexus/ │ │ ├── Makefile │ │ ├── exp.txt │ │ └── main.loc │ ├── let-crosslang/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── f.hpp │ │ ├── f.py │ │ └── main.loc │ ├── let-expressions/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── foo.R │ │ ├── foo.hpp │ │ ├── foo.py │ │ └── main.loc │ ├── local-import-cousin-py/ │ │ ├── Makefile │ │ ├── bar/ │ │ │ └── baz/ │ │ │ ├── main.loc │ │ │ └── main.py │ │ ├── bif/ │ 
│ │ └── biz/ │ │ │ ├── main.loc │ │ │ └── main.py │ │ ├── exp.txt │ │ └── main.loc │ ├── local-import-nested-py/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── lib/ │ │ │ └── math/ │ │ │ ├── main.loc │ │ │ └── main.py │ │ ├── main.loc │ │ ├── package.yaml │ │ ├── util.loc │ │ └── util.py │ ├── local-import-root-py/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── main.loc │ │ └── root/ │ │ ├── main.loc │ │ └── main.py │ ├── manifold-form-0/ │ │ ├── Makefile │ │ ├── exp.txt │ │ └── t0.loc │ ├── manifold-form-0x/ │ │ ├── Makefile │ │ ├── exp.txt │ │ └── main.loc │ ├── manifold-form-1/ │ │ ├── Makefile │ │ ├── exp.txt │ │ └── t1.loc │ ├── manifold-form-2/ │ │ ├── Makefile │ │ ├── exp.txt │ │ └── t2.loc │ ├── manifold-form-2x/ │ │ ├── Makefile │ │ ├── exp.txt │ │ └── t2.loc │ ├── manifold-form-3/ │ │ ├── Makefile │ │ ├── exp.txt │ │ └── t3.loc │ ├── manifold-form-3x/ │ │ ├── Makefile │ │ ├── exp.txt │ │ └── t3.loc │ ├── manifold-form-4_c/ │ │ ├── Makefile │ │ ├── exp.txt │ │ └── t4.loc │ ├── manifold-form-4_py/ │ │ ├── Makefile │ │ ├── exp.txt │ │ └── t4.loc │ ├── manifold-form-4_r/ │ │ ├── Makefile │ │ ├── exp.txt │ │ └── main.loc │ ├── manifold-form-5_c/ │ │ ├── Makefile │ │ ├── exp.txt │ │ └── t5.loc │ ├── manifold-form-5_py/ │ │ ├── Makefile │ │ ├── exp.txt │ │ └── t5.loc │ ├── manifold-form-5_r/ │ │ ├── Makefile │ │ ├── exp.txt │ │ └── t5.loc │ ├── manifold-form-6_c/ │ │ ├── Makefile │ │ ├── exp.txt │ │ └── t6.loc │ ├── manifold-form-6_py/ │ │ ├── Makefile │ │ ├── exp.txt │ │ └── t6.loc │ ├── manifold-form-6_r/ │ │ ├── Makefile │ │ ├── exp.txt │ │ └── t6.loc │ ├── manifold-form-7_c/ │ │ ├── Makefile │ │ ├── exp.txt │ │ └── t7.loc │ ├── manifold-form-7_py/ │ │ ├── Makefile │ │ ├── exp.txt │ │ └── t7.loc │ ├── manifold-form-7_r/ │ │ ├── Makefile │ │ ├── exp.txt │ │ └── t7.loc │ ├── memory-interop-misalign-cp/ │ │ ├── Makefile │ │ ├── cppfuncs.loc │ │ ├── exp.txt │ │ ├── foo.hpp │ │ ├── foo.py │ │ ├── main.loc │ │ ├── pyfuncs.loc │ │ └── types.loc │ ├── memory-nested-misalign-cpp/ 
│ │ ├── Makefile │ │ ├── exp.txt │ │ ├── foo.hpp │ │ └── main.loc │ ├── memory-nested-misalign-py/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── foo.py │ │ └── main.loc │ ├── memory-optional-double-cpp/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── foo.hpp │ │ └── main.loc │ ├── memory-optional-double-py/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── foo.py │ │ └── main.loc │ ├── memory-record-pack-cpp/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── foo.hpp │ │ └── main.loc │ ├── memory-record-pack-py/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── foo.py │ │ └── main.loc │ ├── memory-split-block-cpp/ │ │ ├── Makefile │ │ ├── cppfuncs.loc │ │ ├── exp.txt │ │ ├── foo.hpp │ │ ├── foo.py │ │ ├── main.loc │ │ ├── pyfuncs.loc │ │ └── types.loc │ ├── module-form-00n/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── fooroot.loc │ │ └── main.loc │ ├── module-form-011/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── foo.py │ │ ├── foopy.loc │ │ ├── fooroot.loc │ │ └── main.loc │ ├── module-form-01n/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── foo.py │ │ ├── foopy.loc │ │ ├── fooroot.loc │ │ └── main.loc │ ├── module-form-0n0/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── foo.R │ │ ├── foo.py │ │ ├── foopy.loc │ │ ├── foor.loc │ │ ├── fooroot.loc │ │ └── main.loc │ ├── module-form-0n1/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── foo.R │ │ ├── foo.py │ │ ├── foopy.loc │ │ ├── foor.loc │ │ ├── fooroot.loc │ │ └── main.loc │ ├── module-form-101/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── foo.py │ │ ├── fooroot.loc │ │ └── main.loc │ ├── module-form-10n/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── foo.py │ │ ├── fooroot.loc │ │ └── main.loc │ ├── module-form-110/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── foo.py │ │ ├── foopy.loc │ │ ├── fooroot.loc │ │ └── main.loc │ ├── module-form-111/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── foo.py │ │ ├── foopy.loc │ │ ├── fooroot.loc │ │ └── main.loc │ ├── module-form-1n0/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── foo.R │ │ ├── foo.py │ │ ├── foopy.loc │ │ ├── foor.loc │ │ ├── fooroot.loc │ │ └── 
main.loc │ ├── module-form-n00/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── foo.R │ │ ├── foo.py │ │ ├── foopy.loc │ │ ├── foor.loc │ │ ├── fooroot.loc │ │ └── main.loc │ ├── module-form-n01/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── foo.R │ │ ├── foo.py │ │ ├── foopy.loc │ │ ├── foor.loc │ │ ├── fooroot.loc │ │ └── main.loc │ ├── module-form-n10/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── foo.R │ │ ├── foo.py │ │ ├── foopy.loc │ │ ├── foor.loc │ │ ├── fooroot.loc │ │ └── main.loc │ ├── multi-lang-mempty-py/ │ │ ├── Makefile │ │ ├── exp.txt │ │ └── main.loc │ ├── multiple-instances-1-c/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── main.loc │ │ └── rms.h │ ├── multiple-instances-1-py/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── main.loc │ │ └── rms.py │ ├── multiple-instances-1-r/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── main.loc │ │ └── rms.R │ ├── multiple-instances-2-c/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── main.loc │ │ └── rms.h │ ├── multiple-instances-2-py/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── main.loc │ │ └── rms.py │ ├── multiple-instances-2-r/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── main.loc │ │ ├── rms.R │ │ └── rms.py │ ├── multiprocessing-py-1/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── foo.py │ │ └── main.loc │ ├── namespace-basic/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── helpers.loc │ │ └── main.loc │ ├── namespace-disambiguation/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── helpers.loc │ │ └── main.loc │ ├── namespace-ns-composition/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── helpers.loc │ │ └── main.loc │ ├── namespace-ns-double-import/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── helpers.loc │ │ └── main.loc │ ├── namespace-ns-exported/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── helpers.loc │ │ └── main.loc │ ├── namespace-ns-guard/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── helpers.loc │ │ └── main.loc │ ├── namespace-ns-hof/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── helpers.loc │ │ └── main.loc │ ├── namespace-ns-let/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── 
helpers.loc │ │ └── main.loc │ ├── namespace-ns-multi/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── main.loc │ │ ├── mod-a.loc │ │ ├── mod-b.loc │ │ └── mod-c.loc │ ├── namespace-ns-nested-getter/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── helpers.loc │ │ └── main.loc │ ├── namespace-ns-reexport/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── helpers.loc │ │ ├── main.loc │ │ └── middle.loc │ ├── namespace-ns-same-func-name/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── helpers.loc │ │ └── main.loc │ ├── namespace-ns-shadow/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── helpers.loc │ │ └── main.loc │ ├── namespace-ns-unqualified/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── helpers.loc │ │ └── main.loc │ ├── namespace-selective/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── helpers.loc │ │ └── main.loc │ ├── namespace-separate-impls/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── main.loc │ │ ├── mod-a.loc │ │ └── mod-b.loc │ ├── nat-typecheck/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── main.loc │ │ └── src.hpp │ ├── native-morloc-1/ │ │ ├── Makefile │ │ ├── exp.txt │ │ └── main.loc │ ├── native-morloc-2/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── foo.py │ │ └── main.loc │ ├── native-morloc-3/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── foo.py │ │ └── main.loc │ ├── native-morloc-4/ │ │ ├── Makefile │ │ ├── exp.txt │ │ └── main.loc │ ├── native-morloc-5/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── high.loc │ │ └── high.py │ ├── native-morloc-6/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── foo.py │ │ └── main.loc │ ├── native-morloc-7/ │ │ ├── Makefile │ │ ├── exp.txt │ │ └── main.loc │ ├── native-morloc-8/ │ │ ├── Makefile │ │ ├── exp.txt │ │ └── main.loc │ ├── native-morloc-9/ │ │ ├── Makefile │ │ ├── exp.txt │ │ └── main.loc │ ├── nexus-let-lambda/ │ │ ├── Makefile │ │ ├── exp.txt │ │ └── main.loc │ ├── nexus-let-pure/ │ │ ├── Makefile │ │ ├── exp.txt │ │ └── main.loc │ ├── null-keyword/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── main.R │ │ ├── main.hpp │ │ ├── main.loc │ │ └── main.py │ ├── numeric-literals/ │ │ 
├── Makefile │ │ ├── exp.txt │ │ └── main.loc │ ├── object-1-c/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── main.loc │ │ └── person.h │ ├── object-1-py/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── main.loc │ │ └── person.py │ ├── object-1-r/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── main.loc │ │ └── person.R │ ├── optional-coerce-cpp/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── foo.hpp │ │ └── main.loc │ ├── optional-coerce-interop/ │ │ ├── Makefile │ │ ├── cfoo.hpp │ │ ├── cppfuncs.loc │ │ ├── exp.txt │ │ ├── main.loc │ │ ├── pfoo.py │ │ ├── pyfuncs.loc │ │ └── types.loc │ ├── optional-coerce-py/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── foo.py │ │ └── main.loc │ ├── optional-cpp/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── foo.hpp │ │ └── main.loc │ ├── optional-interop-cp/ │ │ ├── Makefile │ │ ├── cppfuncs.loc │ │ ├── exp.txt │ │ ├── foo.hpp │ │ ├── foo.py │ │ ├── main.loc │ │ ├── pyfuncs.loc │ │ └── types.loc │ ├── optional-interop-pr/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── foo.R │ │ ├── foo.py │ │ ├── main.loc │ │ ├── pyfuncs.loc │ │ ├── rfuncs.loc │ │ └── types.loc │ ├── optional-interop-rc/ │ │ ├── Makefile │ │ ├── cppfuncs.loc │ │ ├── exp.txt │ │ ├── foo.R │ │ ├── foo.hpp │ │ ├── main.loc │ │ ├── rfuncs.loc │ │ └── types.loc │ ├── optional-json/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── foo.py │ │ └── main.loc │ ├── optional-py/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── foo.py │ │ └── main.loc │ ├── optional-r/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── foo.R │ │ └── main.loc │ ├── optional-records-cpp/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── foo.hpp │ │ └── main.loc │ ├── optional-records-py/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── foo.py │ │ └── main.loc │ ├── optional-records-r/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── foo.R │ │ └── main.loc │ ├── packer-definitions-1/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── foo.py │ │ └── main.loc │ ├── packer-definitions-2/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── foo.py │ │ ├── lib/ │ │ │ └── json/ │ │ │ ├── json.py │ │ │ └── 
main.loc │ │ └── main.loc │ ├── packer-definitions-3/ │ │ ├── Makefile │ │ ├── dumby.hpp │ │ ├── dumby.py │ │ ├── exp.txt │ │ └── main.loc │ ├── packer-definitions-4/ │ │ ├── Makefile │ │ ├── dumby.hpp │ │ ├── dumby.py │ │ ├── exp.txt │ │ └── main.loc │ ├── packer-definitions-5/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── main.loc │ │ ├── map.hpp │ │ └── map.py │ ├── packets-interop/ │ │ ├── .gitignore │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── foo.R │ │ ├── foo.h │ │ ├── foo.py │ │ ├── main.loc │ │ └── make_test_data.py │ ├── packets-large/ │ │ ├── .gitignore │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── foo.R │ │ ├── foo.h │ │ ├── foo.py │ │ ├── main.loc │ │ ├── make_test_data.py │ │ └── test-data.mpk │ ├── parser-stress/ │ │ ├── Makefile │ │ ├── exp.txt │ │ └── main.loc │ ├── path-shadowing-c/ │ │ ├── Makefile │ │ ├── bar/ │ │ │ ├── main.hpp │ │ │ └── main.loc │ │ ├── baz/ │ │ │ ├── main.hpp │ │ │ └── main.loc │ │ ├── exp.txt │ │ └── main.loc │ ├── path-shadowing-py/ │ │ ├── Makefile │ │ ├── bar/ │ │ │ ├── main.loc │ │ │ └── main.py │ │ ├── baz/ │ │ │ ├── main.loc │ │ │ └── main.py │ │ ├── exp.txt │ │ └── main.loc │ ├── path-shadowing-r/ │ │ ├── Makefile │ │ ├── bar/ │ │ │ ├── main.R │ │ │ └── main.loc │ │ ├── baz/ │ │ │ ├── main.R │ │ │ └── main.loc │ │ ├── exp.txt │ │ └── main.loc │ ├── pattern-getters/ │ │ ├── Makefile │ │ ├── exp.txt │ │ └── main.loc │ ├── pattern-setters/ │ │ ├── .gitignore │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── main-cpp.loc │ │ ├── main-py.loc │ │ ├── main-r.loc │ │ ├── tests.loc │ │ └── types.hpp │ ├── poly-list-1/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── foo.hpp │ │ └── main.loc │ ├── record-docstrings/ │ │ ├── Makefile │ │ ├── algconf.json │ │ ├── exp.txt │ │ ├── foo.py │ │ ├── main.loc │ │ └── sysconf.json │ ├── records-alias/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── foo.py │ │ ├── lib/ │ │ │ └── main.loc │ │ └── main.loc │ ├── records-complex-1/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── foo.R │ │ ├── foo.hpp │ │ ├── foo.py │ │ └── main.loc │ 
├── records-complex-2/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── foo.R │ │ ├── foo.hpp │ │ ├── foo.py │ │ └── main.loc │ ├── records-nested/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── foo.R │ │ ├── foo.hpp │ │ ├── foo.py │ │ └── main.loc │ ├── records-primitive/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── foo.R │ │ ├── foo.hpp │ │ ├── foo.py │ │ └── main.loc │ ├── recursion-cross-py-cpp/ │ │ ├── Makefile │ │ ├── cpp_helpers.hpp │ │ ├── exp.txt │ │ ├── main.loc │ │ └── py_helpers.py │ ├── recursion-cross-r-cpp/ │ │ ├── Makefile │ │ ├── cpp_helpers.hpp │ │ ├── exp.txt │ │ ├── main.loc │ │ └── r_helpers.R │ ├── recursion-direct-cpp/ │ │ ├── Makefile │ │ ├── exp.txt │ │ └── main.loc │ ├── recursion-direct-py/ │ │ ├── Makefile │ │ ├── exp.txt │ │ └── main.loc │ ├── recursion-direct-r/ │ │ ├── Makefile │ │ ├── exp.txt │ │ └── main.loc │ ├── recursion-helper-cpp/ │ │ ├── Makefile │ │ ├── exp.txt │ │ └── main.loc │ ├── recursion-helper-py/ │ │ ├── Makefile │ │ ├── exp.txt │ │ └── main.loc │ ├── recursion-mutual-cpp/ │ │ ├── Makefile │ │ ├── exp.txt │ │ └── main.loc │ ├── recursion-mutual-py/ │ │ ├── Makefile │ │ ├── exp.txt │ │ └── main.loc │ ├── recursion-mutual-r/ │ │ ├── Makefile │ │ ├── exp.txt │ │ └── main.loc │ ├── recursion-thunk-helper-cpp/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── foo.hpp │ │ └── main.loc │ ├── recursion-thunk-py/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── foo.py │ │ └── main.loc │ ├── scoping-1/ │ │ ├── Makefile │ │ ├── exp.txt │ │ └── w.loc │ ├── scoping-10/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── high.loc │ │ ├── high.py │ │ └── low.loc │ ├── scoping-11/ │ │ ├── Makefile │ │ ├── exp.txt │ │ └── main.loc │ ├── scoping-12/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── foo.py │ │ └── main.loc │ ├── scoping-13/ │ │ ├── Makefile │ │ ├── core.hpp │ │ ├── exp.txt │ │ ├── foo/ │ │ │ ├── main.loc │ │ │ └── test/ │ │ │ ├── bar.py │ │ │ └── main.loc │ │ ├── foo-cpp.loc │ │ └── main.loc │ ├── scoping-2/ │ │ ├── Makefile │ │ ├── exp.txt │ │ └── w.loc │ ├── scoping-3/ │ 
│ ├── Makefile │ │ ├── exp.txt │ │ └── w.loc │ ├── scoping-4/ │ │ ├── Makefile │ │ ├── exp.txt │ │ └── w.loc │ ├── scoping-5/ │ │ ├── Makefile │ │ ├── exp.txt │ │ └── w.loc │ ├── scoping-6/ │ │ ├── Makefile │ │ ├── exp.txt │ │ └── w.loc │ ├── scoping-7/ │ │ ├── Makefile │ │ ├── exp.txt │ │ └── w.loc │ ├── scoping-8/ │ │ ├── Makefile │ │ ├── exp.txt │ │ └── w.loc │ ├── scoping-9/ │ │ ├── Makefile │ │ ├── exp.txt │ │ └── w.loc │ ├── selection-1/ │ │ ├── Makefile │ │ ├── exp.txt │ │ └── main.loc │ ├── selection-2/ │ │ ├── Makefile │ │ ├── arithmetic/ │ │ │ └── main.loc │ │ ├── exp.txt │ │ └── main.loc │ ├── selection-3/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── main.loc │ │ └── rms.R │ ├── selection-4/ │ │ ├── Makefile │ │ ├── exp.txt │ │ └── main.loc │ ├── serial-form-10-c/ │ │ ├── Makefile │ │ ├── exp.txt │ │ └── main.loc │ ├── serial-form-10-py/ │ │ ├── Makefile │ │ ├── exp.txt │ │ └── main.loc │ ├── serial-form-10-r/ │ │ ├── Makefile │ │ ├── exp.txt │ │ └── main.loc │ ├── serial-form-11-c/ │ │ ├── Makefile │ │ ├── exp.txt │ │ └── main.loc │ ├── serial-form-11-py/ │ │ ├── Makefile │ │ ├── exp.txt │ │ └── main.loc │ ├── serial-form-11-r/ │ │ ├── Makefile │ │ ├── exp.txt │ │ └── main.loc │ ├── serial-form-12-c/ │ │ ├── Makefile │ │ ├── exp.txt │ │ └── main.loc │ ├── serial-form-12-py/ │ │ ├── Makefile │ │ ├── exp.txt │ │ └── main.loc │ ├── serial-form-12-r/ │ │ ├── Makefile │ │ ├── exp.txt │ │ └── main.loc │ ├── serial-form-2-c/ │ │ ├── Makefile │ │ ├── exp.txt │ │ └── main.loc │ ├── serial-form-2-py/ │ │ ├── Makefile │ │ ├── exp.txt │ │ └── main.loc │ ├── serial-form-2-r/ │ │ ├── Makefile │ │ ├── exp.txt │ │ └── main.loc │ ├── serial-form-4-c/ │ │ ├── Makefile │ │ ├── exp.txt │ │ └── main.loc │ ├── serial-form-4-py/ │ │ ├── Makefile │ │ ├── exp.txt │ │ └── main.loc │ ├── serial-form-4-r/ │ │ ├── Makefile │ │ ├── exp.txt │ │ └── main.loc │ ├── serial-form-5-c/ │ │ ├── Makefile │ │ ├── exp.txt │ │ └── main.loc │ ├── serial-form-5-py/ │ │ ├── Makefile │ │ ├── exp.txt │ 
│ └── main.loc │ ├── serial-form-5-r/ │ │ ├── Makefile │ │ ├── exp.txt │ │ └── main.loc │ ├── serial-form-6-c/ │ │ ├── Makefile │ │ ├── exp.txt │ │ └── main.loc │ ├── serial-form-6-py/ │ │ ├── Makefile │ │ ├── exp.txt │ │ └── main.loc │ ├── serial-form-6-r/ │ │ ├── Makefile │ │ ├── exp.txt │ │ └── main.loc │ ├── serial-form-7-c/ │ │ ├── Makefile │ │ ├── exp.txt │ │ └── main.loc │ ├── serial-form-7-py/ │ │ ├── Makefile │ │ ├── exp.txt │ │ └── main.loc │ ├── serial-form-7-r/ │ │ ├── Makefile │ │ ├── exp.txt │ │ └── main.loc │ ├── serial-form-8-c/ │ │ ├── Makefile │ │ ├── exp.txt │ │ └── main.loc │ ├── serial-form-8-py/ │ │ ├── Makefile │ │ ├── exp.txt │ │ └── main.loc │ ├── serial-form-8-r/ │ │ ├── Makefile │ │ ├── exp.txt │ │ └── main.loc │ ├── serial-form-9-c/ │ │ ├── Makefile │ │ ├── exp.txt │ │ └── main.loc │ ├── serial-form-9-py/ │ │ ├── Makefile │ │ ├── exp.txt │ │ └── main.loc │ ├── serial-form-9-r/ │ │ ├── Makefile │ │ ├── exp.txt │ │ └── main.loc │ ├── slurm-label-codegen/ │ │ ├── Makefile │ │ ├── bar.py │ │ ├── exp.txt │ │ ├── main.loc │ │ └── main.yaml │ ├── source-old-op-py/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── foo.py │ │ └── main.loc │ ├── specialization-1-c/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── foo.hpp │ │ └── main.loc │ ├── specialization-1-py/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── foo.R │ │ ├── foo.py │ │ └── main.loc │ ├── specialization-1-r/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── foo.R │ │ └── main.loc │ ├── specialization-2-c/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── foo.hpp │ │ ├── foo.py │ │ └── main.loc │ ├── specialization-2-py/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── foo.R │ │ ├── foo.py │ │ └── main.loc │ ├── stderr-stdout/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── foo.R │ │ ├── foo.hpp │ │ ├── foo.py │ │ ├── main.loc │ │ └── package.yaml │ ├── stdout-flush-py/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── fun.py │ │ └── main.loc │ ├── string-encoding/ │ │ ├── .gitignore │ │ ├── Makefile │ │ ├── a.json │ │ ├── b.json │ │ ├── exp.txt │ 
│ ├── foo.R │ │ ├── foo.hpp │ │ ├── foo.py │ │ └── main.loc │ ├── string-encoding-utf8/ │ │ ├── Makefile │ │ ├── a.json │ │ ├── exp.txt │ │ ├── foo.R │ │ ├── foo.hpp │ │ ├── foo.py │ │ └── main.loc │ ├── string-escape/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── helper.R │ │ ├── helper.hpp │ │ ├── helper.py │ │ └── main.loc │ ├── string-interpolation/ │ │ ├── Makefile │ │ ├── exp.txt │ │ └── main.loc │ ├── string-json-parsing/ │ │ ├── Makefile │ │ ├── a.json │ │ ├── b.json │ │ ├── c.json │ │ ├── exp.txt │ │ ├── foo.R │ │ ├── foo.hpp │ │ ├── foo.py │ │ └── main.loc │ ├── string-multiline/ │ │ ├── Makefile │ │ ├── exp.txt │ │ └── main.loc │ ├── string-pretty/ │ │ ├── Makefile │ │ ├── exp.txt │ │ └── main.loc │ ├── table-1-c/ │ │ ├── Makefile │ │ ├── exp.txt │ │ └── main.loc │ ├── table-1-py/ │ │ ├── Makefile │ │ ├── exp.txt │ │ └── main.loc │ ├── table-1-r/ │ │ ├── Makefile │ │ ├── exp.txt │ │ └── main.loc │ ├── table-2-c/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── main.loc │ │ └── person.h │ ├── table-2-py/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── main.loc │ │ └── person.py │ ├── table-2-r/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── main.loc │ │ └── person.R │ ├── tensor-comprehensive-cpp/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── main.loc │ │ └── src.hpp │ ├── tensor-comprehensive-cross/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── main.loc │ │ ├── src.R │ │ ├── src.hpp │ │ └── src.py │ ├── tensor-cp/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── main.loc │ │ ├── src.hpp │ │ └── src.py │ ├── tensor-dimensions/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── main.loc │ │ ├── src.hpp │ │ └── src.py │ ├── tensor-nat-basic/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── labeled.hpp │ │ └── main.loc │ ├── tensor-nat-labeled/ │ │ ├── Makefile │ │ ├── cnn.hpp │ │ ├── exp.txt │ │ └── main.loc │ ├── tensor-nexus-cpp/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── main.loc │ │ └── src.hpp │ ├── tensor-pc/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── main.loc │ │ ├── src.hpp │ │ └── src.py │ ├── tensor-pr/ │ │ ├── 
Makefile │ │ ├── exp.txt │ │ ├── main.loc │ │ ├── src.R │ │ └── src.py │ ├── tensor-rp/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── main.loc │ │ ├── src.R │ │ └── src.py │ ├── tensor-table-cpp/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── main.loc │ │ └── src.hpp │ ├── thunk-basic/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── foo.hpp │ │ └── main.loc │ ├── thunk-choose/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── foo.py │ │ └── main.loc │ ├── thunk-cross-force/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── foo.hpp │ │ ├── foo.py │ │ └── main.loc │ ├── thunk-do/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── foo.hpp │ │ └── main.loc │ ├── thunk-effects/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── foo.hpp │ │ └── main.loc │ ├── thunk-eval-forall/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── main.loc │ │ └── rng.py │ ├── thunk-eval-hk/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── main.loc │ │ └── rng.py │ ├── thunk-export/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── foo.hpp │ │ ├── foo.py │ │ └── main.loc │ ├── thunk-export-guard/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── foo.hpp │ │ └── main.loc │ ├── thunk-force/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── foo.hpp │ │ └── main.loc │ ├── thunk-guard-cross/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── foo.hpp │ │ ├── foo.py │ │ └── main.loc │ ├── thunk-interop/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── foo.R │ │ ├── foo.hpp │ │ ├── foo.py │ │ └── main.loc │ ├── thunk-let/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── foo.hpp │ │ └── main.loc │ ├── thunk-nullary-interop/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── foo.hpp │ │ ├── foo.py │ │ └── main.loc │ ├── two-module/ │ │ ├── Makefile │ │ ├── combat.loc │ │ ├── exp.txt │ │ ├── tavern.loc │ │ ├── util.loc │ │ └── util.py │ ├── type-alias-transitive/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── foo.hpp │ │ ├── main.loc │ │ ├── types/ │ │ │ └── main.loc │ │ └── types-cpp.loc │ ├── type-annotations-1/ │ │ ├── Makefile │ │ ├── exp.txt │ │ └── main.loc │ ├── type-identities-c/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── main.loc │ │ 
└── types.h │ ├── type-synthesis-1/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── foo.py │ │ └── main.loc │ ├── type-synthesis-2/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── lib/ │ │ │ ├── foo/ │ │ │ │ ├── foo.py │ │ │ │ └── main.loc │ │ │ └── footypes/ │ │ │ └── main.loc │ │ └── main.loc │ ├── typeclass-stress/ │ │ ├── Makefile │ │ ├── exp.txt │ │ └── main.loc │ ├── typeclasses-1/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── foo.hpp │ │ ├── foo.py │ │ └── main.loc │ ├── typeclasses-2/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── foo.hpp │ │ ├── foo.py │ │ └── main.loc │ ├── typeclasses-3/ │ │ ├── Makefile │ │ ├── exp.txt │ │ └── main.loc │ ├── typeclasses-4/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── foo.py │ │ └── main.loc │ ├── typeclasses-5/ │ │ ├── Makefile │ │ ├── exp.txt │ │ └── main.loc │ ├── typeclasses-6/ │ │ ├── Makefile │ │ ├── exp.txt │ │ └── main.loc │ ├── typeclasses-7/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── foo.hpp │ │ ├── foo.py │ │ └── main.loc │ ├── typeclasses-8/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── foo.py │ │ └── main.loc │ ├── typeclasses-9/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── foo.py │ │ └── main.loc │ ├── unicode-edge-cases/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── foo.py │ │ └── main.loc │ ├── unicode-interop/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── foo.hpp │ │ ├── foo.py │ │ └── main.loc │ ├── unicode-interpolation/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── foo.py │ │ └── main.loc │ ├── unicode-source/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── foo.hpp │ │ ├── foo.py │ │ └── main.loc │ ├── unicode-source-cpp/ │ │ ├── Makefile │ │ ├── exp.txt │ │ ├── foo.hpp │ │ └── main.loc │ └── unit-1/ │ ├── Makefile │ ├── exp.txt │ ├── foo.py │ └── main.loc ├── install-tests/ │ ├── .gitignore │ ├── README.md │ ├── run-tests.sh │ ├── testcpp1/ │ │ ├── main.loc │ │ ├── package.yaml │ │ └── square.hpp │ ├── testcpp2/ │ │ ├── main.loc │ │ ├── package.yaml │ │ └── src/ │ │ └── dbl.hpp │ ├── testcpp3/ │ │ ├── inc.hpp │ │ ├── main.loc │ │ └── offset.hpp │ ├── 
testdatafile1/ │ │ ├── data.txt │ │ ├── main.loc │ │ ├── package.yaml │ │ └── reader.py │ ├── testpy1/ │ │ ├── helpers.py │ │ ├── main.loc │ │ └── package.yaml │ ├── testpy2/ │ │ ├── main.loc │ │ ├── package.yaml │ │ └── src/ │ │ └── mathutil.py │ ├── testpy3/ │ │ ├── fmtlib.py │ │ ├── formatter.py │ │ └── main.loc │ ├── testr1/ │ │ ├── main.loc │ │ ├── negate.R │ │ └── package.yaml │ ├── testr2/ │ │ ├── main.loc │ │ ├── package.yaml │ │ └── src/ │ │ └── triple.R │ └── testr3/ │ ├── glue.R │ ├── main.loc │ └── rutil.R ├── integration/ │ ├── Main.hs │ └── Morloc/ │ └── Test/ │ ├── Common.hs │ ├── ConcurrencyTests.hs │ ├── DaemonTests.hs │ ├── InstallTests.hs │ ├── ShmTests.hs │ └── StressTests.hs ├── shm-tests/ │ ├── cppfuncs.loc │ ├── main.loc │ ├── pyfuncs.loc │ ├── stress.hpp │ ├── stress.py │ └── types.loc ├── stress/ │ ├── .gitignore │ ├── README.md │ ├── common.sh │ ├── concurrent-stress.sh │ ├── crash-recovery.sh │ ├── run-all.sh │ ├── valgrind-check.sh │ └── zombie-stress.sh ├── test.sh └── typecheck-benchmark/ ├── apply-ann-20.loc ├── apply-deep-10.loc ├── apply-deep-100.loc ├── apply-deep-30.loc ├── apply-deep-50.loc ├── apply-deep.loc ├── apply-multi-arg-20.loc ├── compose-10.loc ├── compose-20.loc ├── compose-40.loc ├── partial-app.loc ├── poly-compose.loc ├── run-benchmarks.sh └── tuple-nested-20.loc ================================================ FILE CONTENTS ================================================ ================================================ FILE: .dockerignore ================================================ # Ignore build artifacts to keep Docker context small .stack-work/ .git/ out/ container/static-build/.stack-work/ morloc-manager/.stack-work/ data/rust/target/ *.hi *.o ================================================ FILE: .github/workflows/release.yml ================================================ # Release workflow: build all binaries + containers, run tests, publish release. 
# # Triggered by pushing a version tag: # git tag v0.68.0 # git push origin v0.68.0 # # Produces for each platform (linux-x86_64, linux-arm64, macos-arm64): # - morloc-manager (Rust binary) # - libmorloc.so (Rust runtime library; .dylib on macOS) # - morloc-nexus (Rust binary) # # All three are attached to the GitHub Release. name: Release on: push: tags: ['v*'] env: REGISTRY: ghcr.io IMAGE_BASE: ghcr.io/morloc-project/morloc jobs: # ---- Build Rust binaries (libmorloc + morloc-nexus + morloc-manager) per platform ---- rust-binary: strategy: fail-fast: false matrix: include: - os: ubuntu-latest platform: linux-x86_64 method: docker - os: ubuntu-24.04-arm platform: linux-arm64 method: docker - os: macos-latest platform: macos-arm64 method: native runs-on: ${{ matrix.os }} timeout-minutes: 30 steps: - uses: actions/checkout@v4 # ---- Linux: Docker container build ---- # libmorloc.so + morloc-nexus: glibc (Ubuntu 20.04) # morloc-manager: static (Alpine/musl) - name: Build Rust binaries (Linux) if: matrix.method == 'docker' run: | docker build -t morloc-rust-build \ -f container/static-build/Dockerfile . 
mkdir -p out docker run --rm -v "$(pwd)/out:/out" morloc-rust-build # Verify morloc-manager is static file out/morloc-manager | grep -qE "static(ally|-pie) linked" - name: Rename artifacts (Linux) if: matrix.method == 'docker' run: | mv out/libmorloc.so out/libmorloc-${{ matrix.platform }}.so mv out/morloc-nexus out/morloc-nexus-${{ matrix.platform }} mv out/morloc-manager out/morloc-manager-${{ matrix.platform }} # ---- macOS: native cargo build ---- - name: Setup Rust (macOS) if: matrix.method == 'native' uses: dtolnay/rust-toolchain@stable - name: Cache Cargo (macOS) if: matrix.method == 'native' uses: actions/cache@v4 with: path: | ~/.cargo/registry ~/.cargo/git data/rust/target key: cargo-macos-${{ hashFiles('data/rust/Cargo.lock') }} restore-keys: cargo-macos- - name: Build Rust binaries (macOS) if: matrix.method == 'native' run: | cd data/rust # Build libmorloc (cdylib produces .dylib on macOS) cargo build --release -p morloc-runtime # Install .dylib so nexus can link against it mkdir -p $HOME/.local/share/morloc/lib cp target/release/libmorloc_runtime.dylib $HOME/.local/share/morloc/lib/libmorloc.dylib # Build nexus cargo build --release -p morloc-nexus # Build manager cargo build --release -p morloc-manager # Collect artifacts mkdir -p ../../out cp target/release/libmorloc_runtime.dylib ../../out/libmorloc-${{ matrix.platform }}.dylib cp target/release/morloc-nexus ../../out/morloc-nexus-${{ matrix.platform }} cp target/release/morloc-manager ../../out/morloc-manager-${{ matrix.platform }} strip ../../out/morloc-nexus-${{ matrix.platform }} || true strip ../../out/morloc-manager-${{ matrix.platform }} || true - name: Upload Rust artifacts uses: actions/upload-artifact@v4 with: name: rust-binaries-${{ matrix.platform }} path: out/* # ---- Run tests using the Rust binaries ---- test: needs: rust-binary runs-on: ubuntu-latest timeout-minutes: 60 env: DEBIAN_FRONTEND: noninteractive steps: - uses: actions/checkout@v4 - uses: haskell-actions/setup@v2 with: 
ghc-version: '9.6.7' enable-stack: true stack-version: 'latest' - uses: actions/cache@v4 with: path: | ~/.stack/snapshots ~/.stack/setup-exe-cache .stack-work key: stack-deps-release-${{ hashFiles('stack.yaml.lock', 'package.yaml') }} restore-keys: stack-deps-release- - name: Increase shared memory run: sudo mount -o remount,size=4G /dev/shm - name: Install system dependencies run: | sudo apt-get update sudo apt-get install -y --no-install-recommends \ r-base-core python3 python3-dev python3-pip \ python3-numpy g++ gcc make libgsl-dev python3 -m pip install --break-system-packages --upgrade setuptools pyarrow - name: Cache R packages uses: actions/cache@v4 id: r-cache with: path: ~/R/library key: r-lib-${{ runner.os }}-${{ runner.arch }} - name: Install R packages if: steps.r-cache.outputs.cache-hit != 'true' run: | mkdir -p ~/R/library LIBARROW_MINIMAL=true ARROW_S3=OFF ARROW_GCS=OFF \ Rscript -e 'install.packages("arrow", lib="~/R/library", repos = "https://cloud.r-project.org")' - name: Download Rust binaries uses: actions/download-artifact@v4 with: name: rust-binaries-linux-x86_64 path: rust-bin - name: Prepare Rust binaries run: | mkdir -p prebuilt mv rust-bin/libmorloc-linux-x86_64.so prebuilt/libmorloc.so mv rust-bin/morloc-nexus-linux-x86_64 prebuilt/morloc-nexus mv rust-bin/morloc-manager-linux-x86_64 prebuilt/morloc-manager chmod +x prebuilt/libmorloc.so prebuilt/morloc-nexus prebuilt/morloc-manager - name: Add morloc to PATH run: | echo "$HOME/.local/bin" >> $GITHUB_PATH echo "$HOME/.local/share/morloc/bin" >> $GITHUB_PATH echo "R_LIBS_USER=$HOME/R/library" >> $GITHUB_ENV - name: Build morloc run: stack install --system-ghc --no-install-ghc --no-run-tests - name: Initialize morloc (using pre-built Rust binaries) run: | MORLOC_RUST_BIN=$(pwd)/prebuilt morloc init -f morloc install stdlib - name: Run tests run: stack test --system-ghc --no-install-ghc morloc:morloc-test timeout-minutes: 10 # ---- Build and push container images ---- containers: needs: test 
runs-on: ubuntu-latest timeout-minutes: 120 permissions: packages: write steps: - uses: actions/checkout@v4 - name: Extract version from tag id: ver run: echo "version=${GITHUB_REF_NAME#v}" >> "$GITHUB_OUTPUT" - name: Login to GHCR uses: docker/login-action@v3 with: registry: ghcr.io username: ${{ github.actor }} password: ${{ secrets.GITHUB_TOKEN }} - name: Build tiny (from local source) run: | docker build \ -t ${{ env.IMAGE_BASE }}/morloc-tiny:${{ steps.ver.outputs.version }} \ -t ${{ env.IMAGE_BASE }}/morloc-tiny:edge \ -f container/tiny/Dockerfile . - name: Build full (uses local tiny) run: | docker build \ --build-arg MORLOC_VERSION=${{ steps.ver.outputs.version }} \ -t ${{ env.IMAGE_BASE }}/morloc-full:${{ steps.ver.outputs.version }} \ -t ${{ env.IMAGE_BASE }}/morloc-full:edge \ container/full/ - name: Push all images run: | for img in morloc-tiny morloc-full; do docker push ${{ env.IMAGE_BASE }}/${img}:${{ steps.ver.outputs.version }} docker push ${{ env.IMAGE_BASE }}/${img}:edge done # ---- Create GitHub Release ---- release: if: always() && needs.containers.result == 'success' needs: [containers, rust-binary] runs-on: ubuntu-latest permissions: contents: write steps: - name: Download all artifacts uses: actions/download-artifact@v4 with: pattern: 'rust-binaries-*' merge-multiple: true - name: List artifacts run: ls -lh - name: Create GitHub Release uses: softprops/action-gh-release@v2 with: files: | morloc-manager-* libmorloc-* morloc-nexus-* generate_release_notes: true ================================================ FILE: .github/workflows/test.yml ================================================ name: Test Morloc on: [push] jobs: linux-test: runs-on: ubuntu-latest timeout-minutes: 60 env: DEBIAN_FRONTEND: noninteractive steps: - name: Checkout uses: actions/checkout@v4 - name: Setup Haskell (GHC + Stack) uses: haskell-actions/setup@v2 with: ghc-version: '9.6.7' enable-stack: true stack-version: 'latest' - name: Setup Rust uses: 
dtolnay/rust-toolchain@stable - name: Cache Stack dependencies uses: actions/cache@v4 with: path: | ~/.stack/snapshots ~/.stack/setup-exe-cache .stack-work key: stack-deps-${{ hashFiles('stack.yaml.lock', 'package.yaml') }} restore-keys: | stack-deps- - name: Cache Cargo dependencies uses: actions/cache@v4 with: path: | ~/.cargo/registry ~/.cargo/git data/rust/target key: cargo-deps-${{ hashFiles('data/rust/Cargo.lock') }} restore-keys: | cargo-deps- - name: Increase shared memory (needed for morloc SHM pool tests) run: sudo mount -o remount,size=4G /dev/shm - name: Install system dependencies run: | sudo apt-get update sudo apt-get install -y --no-install-recommends \ r-base-core \ python3 \ python3-dev \ python3-pip \ python3-numpy \ g++ \ gcc \ make \ libgsl-dev python3 -m pip install --break-system-packages --upgrade setuptools pyarrow - name: Cache R packages uses: actions/cache@v4 id: r-cache with: path: ~/R/library key: r-lib-${{ runner.os }}-${{ runner.arch }} - name: Install R packages if: steps.r-cache.outputs.cache-hit != 'true' run: | mkdir -p ~/R/library LIBARROW_MINIMAL=true ARROW_S3=OFF ARROW_GCS=OFF \ Rscript -e 'install.packages("arrow", lib="~/R/library", repos = "https://cloud.r-project.org")' - name: Add morloc bin folders to PATH run: | echo "$HOME/.local/bin" >> $GITHUB_PATH echo "$HOME/.local/share/morloc/bin" >> $GITHUB_PATH echo "R_LIBS_USER=$HOME/R/library" >> $GITHUB_ENV - name: Build Morloc run: | stack install --system-ghc --no-install-ghc --no-run-tests - name: Initialize morloc and install modules run: | MORLOC_RUST_DIR=$(pwd)/data/rust morloc init -f morloc install stdlib - name: Test morloc run: | stack test --system-ghc --no-install-ghc morloc:morloc-test timeout-minutes: 10 ================================================ FILE: .gitignore ================================================ tags *.hi *.o .stack-work/ .history morloc.cabal *.out run/ .idea/ *.iml # ignore debugging files *.aux *.hp *.prof *.ps .bash_history .local 
.stack CLAUDE.md .claude/ claude-memory/ .RData .Rhistory pools/ nexus out/ ================================================ FILE: ChangeLog.md ================================================ 0.81.0 [2026-04-22] ------------------- * fix type inference for type families * extend intrinsic support for language-agnostic code * do shell-expansion of flagfile lines in morloc-manager * fix loss of pool stderr on crash (maybe?) 0.80.1 [2026-04-21] ------------------- * add `morloc-manager new --include ` src:dest syntax * make stderr/stdout mim principles more consistent 0.80.0 [2026-04-20] ------------------- * cleaner morloc-manager * fixed --print bug in nexus 0.79.1-5 [2026-04-19] --------------------- * lots of morloc-manager updates 0.79.0 [2026-04-17] ------------------- * add @datafile intrinsic for finding installed files * default to including all files when installing - parse `.morlocignore` to find non-install files - allow `include` in package.yaml for strict file inclusion * add `morloc-manager doctor` subcommand for health checks * add additional `freeze/unfreeze` validation * fix unfreezing bugs 0.78.0 [2026-04-17] ------------------- * clean up CLI usage statements * suppress "null" output in Unit-returning CLIs * fix string escape bugs * fix where parsing after do-block * fix many small morloc-manager issues * fix paths in installed morloc programs 0.77.1 [2026-04-16] ------------------- * resurrected `morloc-manager log` subcommand 0.77.0 [2026-04-15] ------------------- * many many deployment fixes 0.76.0 [2026-04-13] ------------------- * fix docstring groups * add module docstrings * fix bug in unfreeze 0.75.0 [2026-04-12] ------------------- * allow effectful final do-notation statements * lots of bug fixes * make changelog version source of truth 0.74.0 [2026-04-06] ------------------- * unify morloc-manager env, workspace, and version * allow docstrings before declarations * allow literal leading spaces in docstrings * allow escaped `:` syntax 0.73.0 [2026-04-01]
------------------- * fix @load error on missing file * fix error reporting on failed `morloc-manager install` 0.72.0 [2026-03-30] ------------------- * fix unicode support in comments and literal strings * many fixes to the morloc-manager 0.71.0-2 [2026-03-29] ------------------- * port morloc-manager to rust 0.70.1 to 0.70.6 [2026-03-29] ----------------------------- * fix portability for libmorloc and morloc-nexus on darwin and linux-arm64 * python flushing race condition 0.70.0 [2026-03-29] ------------------- * port libmorloc and morloc-nexus from C to Rust 0.69.0 [2026-03-27] ------------------- * port morloc-manager from shell to Haskell * share it as a static binary 0.68.0 [2026-03-22] ------------------- * remove explicit universal quantifiers - before: `id a :: a -> a` - now: `id :: a -> a` * add `morloc uninstall --all` option * do not require repeated `let` terms 0.67.1 [2026-03-17] ------------------- * add missing Nat kind annotation to root modules * better test coverage of Nat kinds * add `morloc uninstall --all` option * add `stdlib` module that simplifies recursive install of everything 0.67.0 [2026-03-17] ------------------- * add Arrow tables with zero-copy between language sharing * add tensors * remove explicit qualifiers - no more `id a :: a -> a` - now `id :: a -> a` - this does not require C++ be more explicit in their typing * inline when packet data is smaller than 65kb - this avoids fragmenting the shared memory with many small single-use values 0.66.0 [2026-03-12] ------------------- * fix propagation of errors from crashed pools * fix shm memory alignment (inefficiency on x86, crashes on ARM) * add `--sanitize` option to `morloc init` for strict memory * replace megaparsec with parsec * fix label and remote handling 0.65.0 [2026-03-10] ------------------- * `morloc eval` for running anonymous morloc expressions * add %inline pragma to skip manifold gen * allow batch syntax for instances * add @show and @read intrinsics * add
namespaces for morloc imports 0.64.0 [2026-03-03] ------------------- * replace thunks with more granular effect system * add intrinsics * disambiguate local module imports * change null to Null 0.63.0 [2026-02-25] ------------------- * add optionals with implicit coercion * for `?Str` with `literal: true`, force `default: null` * add daemon args to nexus 0.62.0 [2026-02-24] ------------------- * term recursion support * conditional guards * nexus pretty printing option (-p/--print) * print defaults in usage statements * more bug fixes 0.61.0 [2026-02-21] ------------------- Build updates * make nexus a constant binary (not recreated and recompiled) * add install handling and portable scripts * add morloc daemon mode accessible through HTTP/TCP and sockets * add `morloc install --build` option for installing both executable modules * add `morloc uninstall` * add `morloc list` with -v option for listing types of all exports Typesystem updates * add let syntax that enforces execution order * class constraints (e.g., unique :: Eq a => [a] -> [a]) * superclasses (e.g., class Semigroup => Monoid a where ...) 
* add effect system for delayed execution * add do-syntax for imperative programming with effects Better errors and UI * cleaner error messages * error message localization * clean `morloc typecheck` output * add CLI subcommand tested grouping * Add shell TAB-completion * fix haddock for future hackage release Bug fixes * cleaned up memory issues in all C code * replaced mcparallel in R with forked pool of workers * fix bug in `morloc install .` Testing * added stress test for zombies and memory issues * added daemon tests Performance * Split the monolithic (~7000 line) morloc.h file * Use a libmorloc.so shared library rather than importing all as header * Removed all the zombie swarms that where killing heavy morloc projects * Remove mcparallel from R, move most of the pool to C, 4X interop speed * Compile and reuse a single nexus (reduce compile costs) Language onboarding * Added codegen IR that greatly simplifies new language addition * Factor all language-specific material out of main Haskell codebase * Move all grammar into template yaml specs * Created MessagePack bridge to bypass voidstar, making lang onboard almost trivial (at a performance penalty). 
Other * Transitioned parser from recursive descent to LR1 0.60.0 [2026-02-07] ------------------- * add infix operator support Testing * Generate many new tests with Claude * Extensive testing of infix operators and module inheritance Cleanup * add formatting with fourmulo * add metric and benchmarking Bug fixes * Fix several memory issues in morloc.h and lang bindings * Fixed indexing bug in Generator.hs * Fix missing space in git module cp * Make missing folders in install path * Fix `morloc install` deletion of mod folder when install has trailing '/' * Disallow space between sign and number Performance * Fixed exponential case hit on eta resolution * Fixed quadratic case in subtype algorithm Claude memory * Added claude memory files 0.59.0 [2026-01-23] ------------------- * allow functions in data structures * allow source functions to return functions * allow application of expressions that evaluate to functions * fix bug in C++ bool deserialization 0.58.3 [2026-01-03] ------------------- * fix record docstring inheritance 0.58.2 [2025-12-29] ------------------- * fix minor bug optional versus positional 0.58.1 [2025-12-28] ------------------- * fix minor bug in record unrolling 0.58.0 [2025-12-28] ------------------- * add hex, octal, and binary numeric representations * new record syntax * generate CLI from docstrings * resolve records into groups of arguments * allow literal strings without the extra JSON quoting * change to Apache-2.0 0.57.1 [2025-11-12] ------------------- * minor bug fixes 0.57.0 [2025-11-11] ------------------- * re-allow underscores in variable names * add placeholder syntax / lambda lifting from holes * multi-line strings * string interpolation * getter patterns * setter patterns * write full Morloc nexus evaluator * Fix bug in local installs with "." 
0.56.0 [2025-10-08] ------------------- New file organization * Change file layout to conform to XDG spec; replaced `~/.morloc` with `~/.local/share/morloc` * Move standard library to `$MORLOC_HOME/src/morloc/plane/default/morloclib` * src/ - stores any source code morloc needs, not just modules * morloc/ - stores morloc modules * plane/ - stores morloc modules that are part of a plane * default/ - the current default plane * morloclib/ - the org name for the core modules in the default plane New `morloc install` subcommand functionality * Multiple imports may be chained on one command * Source and ref can be included per install, for example: * `root` - install a core module * `root@hash:abcdef1234` - specific core instance * `root@tag:v1.0.0` - specific tag/version * `codeberg:weena/calendar@hash:abcdef1234` - 3rd party with source and ref * Support for install of local modules 0.55.1 [2025-09-29] ------------------- * Bug fixes 0.55.0 [2025-09-27] ------------------- * Allow general types to be declared and imported/exported * Allow undirected dependencies * Allow dashes in module names * Fix many bugs in native Morloc code handling * Fix bug in certain higher order foreign functions * Simplify internal unique naming conventions * Move all tests to use the new root module (rather than base) * Slightly improved error messages Breaking changes: * Move to reverse tree model of dependency handling * Allow exactly one type signature for each term and class * Require explicit typeclass import/export * Fix handling of Python builtin imports Now builtins must not be imported from Python source. 
Instead import directly from Python, for example: `source Py ("len")` * More efficient Haskell Map usage 0.54.2 [2025-08-09] ------------------- * Enforce lowercase module name rule * Fix handling of executable file name option * Fix record handling 0.54.1 [2025-07-26] ------------------- * Fix pickle bug in Python multiprocessing * Replace asprintf non-standard C function * Partially fix interop for C structs * Fix bug in unqualified imports 0.54.0 [2025-07-13] ------------------- * Add full MessagePack and VoidStar IO to nexus * Fixed type pretty printing in usage and typechecking output * Add nexus option and usage info * Add support for one-line command docstrings 0.53.7 [2025-05-31] ------------------- * Fix bug in parameterized type definition concrete type inference 0.53.6 [2025-05-31] ------------------- * Improve container instructions in README * Fix all README examples * Make Dockerfiles more portable * Fix bug in implicit typeclass instance inheritance 0.53.5 [2025-05-12] ------------------- * Fixed unnecessary copying in C libs * Fixed double let-binding in code gen 0.53.4 [2025-05-08] ------------------- * Replace C daemon forking with thread pooling (4X speedup) * Fix bugs related to 0-length array memory allocation 0.53.3 [2025-05-06] ------------------- * Fix handling of empty vectors 0.53.2 [2025-05-06] ------------------- * Fix bug in JSON parsing 0.53.1 [2025-05-06] ------------------- * Update containers * Update github actions * Fix bug in type scoping (sort of) 0.53.0 [2025-05-04] ------------------- Unify backend under shared C library * Replace python nexus with C nexus * Move packets to little-endian format * Move all packet handling, binary protocol specs, socket handling, JSON parsing from pool code into the shared morloc.h library * Replace R `future` parallelism scheme with builtin `parallel` library Add remote worker and resource management support * Add conventions for specifying caching and evaluation strategy * Add xxhash hashing 
for caching * Add remote handling with experimental slurm support Other * `morloc` commands now return proper exit codes 0.52.1 [2025-02-16] ------------------- * Add python native bytes and bytearray support 0.52.0 [2025-02-09] ------------------- Type evaluation and specialization * Delayed general alias evaluation * Add strict numeric types (`int8`, `uint8`, `int16` etc) * Allow concrete alias specialization * Add type hints allowing concrete type conservation across foreign calls Bug fixes * Fix bug in opening existing shared memory volumes Language support * Add C++ support for std template list-like types (`list`, `forward_list`, `deque`, `stack`, and `set` (I know, they're a tad different) * Add Python support for `numpy` vectors and arrays * Allow raw R vectors to be interpreted as strings * Nexus no longer creates python objects from returned data, instead writes results directly through C library (`morloc.h`) 0.51.1 [2024-12-04] ------------------- * Do not catch STDOUT and STDERR * Fix NULL return errors * Fix container setup 0.51.0 [2024-12-02] ------------------ Shared memory * Allow processes to communicate through shared memory Setup * `morloc init` command will now build the `morloc` ecosystem, writing all required headers to `morloc` home and compiling any required shared libraries. 
Other * Fix cases where morloc stalls when errors are transmitted across languages * Moved demos to the dedicated example repo 0.50.0 [2024-11-08] ------------------- Better installation * `morloc install --commit 45d8df12` - for github retrieval by commit hash * `morloc install --branch dev` - to retrieve latest from specific branch * `morloc install --tag 0.1.0` - to retrieve specific tag Better containers * Use podman rather than docker in Makefile * `morloc-tiny:` - everything needed to compile morloc projects * `morloc-full:` - an environment for running projects 0.49.0 [2024-11-04] ------------------- New backend with better performance * Mediate inter-process communication with UNIX domain sockets * Transmit data with MessagePack rather than JSON * Added a benchmarking suite * Added `morloc init` command to configure morloc ecosystem 0.48.0 [2024-05-10] ------------------- Second PeerJ submission (after return by editor for technical reasons) * Made type parameters explicit as type arguments: `id a :: a -> a` rather than either of `id :: a -> a` `id :: forall a . a -> a`. * Pass-by-reference in generated C++ code * Simplify generated C++ code by using function template arguments rather than type casting. 
0.47.2 [2024-04-28] ------------------- * made the build static * fixed the dockerfile * exported the vim-syntax file out to its own repo * added a --version option * upgraded to LTS 22.18 0.47.2 [2024-04-28] ------------------- First PeerJ submission 0.47.0 [2024.03.10] ------------------- * Add value checker * Raise error when implementations have equal score (no arbitrary choice) 0.46.0 [2024.03.06] ------------------- * Fix precedence of '@' operator - it binds tightest * Update flu demo * Fix github actions * Fix Dockerfile * Address all compiler warnings 0.45.0 [2024.02.14] ------------------- * Allow explicit import of polymorphic terms * Fix infinite loop bug when two many arguments are applied to a function * Synchronise tests with new core libraries type classes 0.44.0 [2024.02.08] ------------------- Add support for ad hoc polymorphism. * Support sources and declarations in classes * Support multiple parameters * Support overlapping instances * Packers are now implemented through the `Packable` typeclass Some missing features: * No support typeclass constraints in the type signatures. * No support for parameterized class variables * No support for polymorphic recursion (does anyone want that?) 0.43.0 [2024.01.14] ------------------- New features * Allow a module to explicitly export packers * Show pool pseudocode for `typecheck -r` * Add `typecheck dump` subcommand to show expressions and indices * Allow nexus inputs to be files * Remove concrete type signatures - always infer * Make fields in language-specific table decs optional Rather than this: table (Person a) = Person {name :: Str, info :: a} table R (Person a) = "data.frame" {name :: Str, info :: a} Allow this: table (Person a) = Person {name :: Str, info :: a} table R (Person a) = "data.frame" Really, I need to totally redo the table/record/object handling. 
* Remove support for anonymous records in type signatures I will re-add this possibly at a future time when I refactor Infrastructure changes * Pass all data between pools as files rather than string arguments * Raise an error if any general type cannot be translated to a concrete type Fixes * Fix record type inference * Fix bug in collecting packers (missed packers required by root manifold) * Fix C++ handling of quotes and special characters in JSON strings 0.42.0 [2023.10.11] ------------------- * Infer concrete types from inferred general types when necessary and possible * More informative error messages * Fix template resolution in generated C++ code * Fix include name shadowing conflict in generated C++ code * Partially fix naming conflict in Python and R pools caused by use of "f". My solution was name mangling, though we need a more permanent solution to our problem. * Let user write correct "list" R types for lists, tuples, and records * Fix bug in code generation of lets ## Internal * For `ForeignInterfaceM` constructor of ExprM, store the full call type, not just the return type * Parameterize `ExprM` with the type type (e.g., `Maybe TypeP` or `TypeM`) * Replace `Argument` and `PreArgument` with a parameterized `Arg` type. * Fix broken `ForeignInterfaceM` and `PoolCallM` cases in `typeOfExprM` * Refactor backend Testing and documentation: * Complete flu demo - it builds now, just need to implement the library code for align and other functions. 
0.41.1 [2023.05.26] ------------------- * Print nothing if "null" is returned * Fix the import of working directory modules * Resolve bug in occur check * Streamline github actions script * Fix `morloc install` path download for core modules * Raise type error for untyped concrete term * Fix bug in concrete type synthesis 0.41.0 [2023.04.16] ------------------- Language updates * Add check to avoid infinite typechecker recursion * Synthesize concrete types from general types when possible * Improve exports * Move exports to module list (as in Haskell) * Add `*` wildcard to export every top-level named term or type * Raise an error if a non-existing term is exported from a module * Allow concrete (un)packers to vary in number of generic terms * Set functions with empty inputs (e.g., `()`) to have empty lists of arguments * Replace the `Null` literal term with `()` Package updates * Default to c++17, rather than c++11 * Restructure library to avoid name conflicts with pre-existing packages * Replace Perl nexus with Python nexus and remove Perl dependencies Better error messages and logs * Resolve "shit output" error message (map index to export name) * Tidy up the verbose diagnostics * Print general and concrete types for typecheck with -r option * Add multiple levels of verbosity (quiet by default) Bug fixes * Typechecking bug in record access * Fix bug allowing undefined things in module export lists * Fix cousin module imports * Fix unparameterized (un)packer serialization * Fix error raised when a module exporting a type is compiled * Fix out of order record fields in nexus output 0.40.0 [2023.02.04] ------------------- * Infer types of records * Fix bug in concrete type inference * Fix bugs in foreign higher order function code generation * Simplify generator code * Add many tests 0.39.0 [2023.01.03] ------------------- * Add compose operator * Allow eta-reduction 0.38.0 [2022.12.23] ------------------- * Choose casing convention * camel case for terms (for now, 
underscore is illegal) * pascal case for types * Fix sub-module handling * Fix import/export of type definitions * Better error messages for import/export errors * Somewhat formatted `typecheck` subcommand output * Add option to typecheck backend (concrete types and language selection) 0.37.0 [2022.12.11] ------------------- * Remove extra space printed at the end of R JSON * Clarify error message for missing exports * Clarify error message for missing concrete signature * Fix exponential time bug in parser * Allow prime characters in names after first position * Allow '.' to separate namespaces in imports/modules * Fix infinite loop bug when module name != import name 0.36.0 [2022.02.17] ------------------- * Separate reals from integers * Remove global haskell extensions from package.yaml 0.36.0 [2022.02.17] ------------------- * Separate reals from integers * Remove global haskell extensions from package.yaml 0.35.0 [2021.10.24] ------------------- Where scoping and a total architecture refactor * Fix handling for generic parameterized types * Improve whitespace handling * Statements are order invariant * Thread link from expression to source expression down to generators * Typecheck over final abstract syntax trees rather than expressions * Separate general and concrete typechecking * Pretty instances for all data types * More testing * Agonized over deep and wide structures 0.34.0 [2021.03.05] ------------------- * Add handling for C++ float primitives * Let C++ programs be imported through a header and shared library * Remove semicolon requirement * Add hie.yaml for compatibility with hsl * Update dependency set to LTS-17.4 * Add subparsers to CLI with pcapriotti/optparse-applicative * Remove brace requirement for modules and `where` statements * Add `-o` option to compiler to specify output executable names * Acceptable syntax error messages 0.33.0 [2020.11.03] ------------------- First hackage release * Haddock documentation * Update README * In help 
statements write universal, not concrete, types * Make default containers non-existential (probably a bad decision?) 0.32.0 [2020.11.01] ------------------- * Add record/table field access * Fix JSON handling in nexus * Fix nexus bug necessitated escaping quotations and braces * Print general types in nexus help * Resolve most GHC warnings 0.31.0 [2020.10.29] ------------------- * Fix anonymous records in C++ * Distinguish 'record', 'object', and 'table' * Add object handling * Add table handling 0.30.0 [2020.10.23] ------------------- * Add `object` keyword for defining record types * Add full record serialization handling (C++, py, R) 0.29.0 [2020.10.21] ------------------- * Add AST directed (de)serialization framework * Add type constructors for parameterized types 0.28.0 [2020.10.12] ------------------- * Allow import/export of type aliases * Refactor with DAGs all through the parser and typechecker 0.27.0 [2020.10.04] ------------------- * Add systematic tests for data serialization * Fix bug in C++ serialization * Move to serialize to dedicated libraries that require no import 0.26.0 [2020.09.27] ------------------- Add `type` keyword for defining type aliases 0.25.0 [2020.09.26] ------------------- No explicit forall. Instead use Haskell convention of generics being lowercase and non-generics being uppercase. 
* no more explicit "forall" * generics are lowercase in type signatures * non-generic types are uppercase * normal functions are lowercase * class constructors are uppercase (though handling for this is not yet implemented) 0.24.0 [2020.09.22] ------------------- Allow integration of many instances 0.23.0 [2020.05.14] Bug fixes and code cleanup Bug fixes / tests - [x] [x] github issue #7 - new Var=> typechecking rule - [x] [x] github issue #9 - rewire container type inference - [x] [x] github issue #10 - [x] [x] github issue #11 0.22.0 [2020.04.28] ------------------- Implement a schema-directed composable serialization system Major changes * Fully composable serialization over containers and primitives * Improved C++ support of generic functions * Record support for R and Python3 (not C++ yet) * Refactor generator - replace old grammar system * Allow arguments to be passed to general functions (e.g., `foo x = [x]`, where no specific language is needed) Minor changes * change default python3 interpreter from "python" to "python3" * add default library and tmp paths to config handler * test composable serialization functions in all supported languages * allow wrapped comments in R Testing - grammar directed testing * test record handling * remove and replace out-of-date golden tests * systematic argument handling tests * systematic manifold form tests * systematic interop testing 0.21.0 [2020.03.31] ------------------- Major - add handling and test for many many corner cases * Allow export of data statements * Allow export of non-functions * Allow functions with containers at the root * Allow export of 0-argument functions Minor * proof-of-concept composable serialization functions in C++ (cppbase) * add python tests * make the test output look pretty (no weird whitespace) 0.20.0 [2020.03.23] ------------------- * Add composable default types 0.19.1 [2020.02.22] ------------------- * bug fixes 0.19.0 [2020.02.20] ------------------- Major changes * Allow currying * 
Add realization optimizations * Refactor generator into series of clear transformations * Added handling for dealing with ambiguous ASTs Minor bug fixes and updates * Prettier code generation for C++, Python and R * More detailed comments in generated code * Allow tags on parenthesized types * Fix bug in functions with multiple parameters * Fix bug preventing loading of package metadata 0.18.1 [2019.11.08] ------------------- * Fix travis * Use C++11 for C++ builds * Make .morloc/config optional * Fix bug in parsing unit type: `()` 0.18.0 [2019.11.04] ------------------- * Add bidirectional type system * Allow parameterized concrete types * Allow higher-order functions * Allow properties to contain multiple terms * Add many tests * Add module system * Allow non-primitive types in lists, tuples, and records * Removed arq and SPARQL dependency (very fast compilation) 0.17.4 [2019.06.29] ------------------- * Add C and C++ handling * Define Ord intance for MTypeMeta * Allow pools to be called as executables * Add type handling to generators * Remove redundant SPARQL queries (better performance) * New RDF list semantics * Use strings to represent concrete types (e.g. "char\*") * Write pretty-printed diagnostic files to `$MORLOC_HOME/tmp` * Handling for multiple concrete type signatures (e.g., definition of a function in multiple languages). * Handling for multiple abstract type signatures * Handling for multiple function declarations 0.17.3 [2019.06.14] ------------------- * Partial C support - execution of sourced functions - no composition - no foreign calls * Partial transition to typed generators - bound arguments are still not typed correctly * Use integer IDs to identify manifolds in pools and the nexus (can to make calls between them) instead of long, mangled names. * Replace string names of languages (e.g., "python") with a sum type. 
0.17.2 [2019.05.05] ------------------- Pycon release 0.17.1 [2019.04.26] ------------------- * Fix output serialization in generate code * Fix module linking in generated code 0.17.0 [2019.04.16] ------------------- * Add morloc home * Load modules from `$MORLOCHOME/lib` * Create monad stack 0.16.2 [2018.03.05] ------------------- * Add Zenodo badge making the project citable * Move to `morloc-project/morloc` github repo 0.16.1 [2018.09.24] ------------------- Minor release consisting of internal refactoring * Pruned unnecessary code * Pruned unnecessary imports * Compliance with stricter compile flags 0.16.0 [2018.09.14] ------------------- * Write RDF bools in lowercase ("true", rather than "True"), as per specs * Stricter node typing (replace ad hoc names with elements from an ADT) * Add very rudimentary typechecking * Remove SPARQL server dependency (now there's a sluggish Jena dependency) 0.15.1 [2018.09.10] ------------------- * Add error handling and reporting to pools * Add type signature comments to generated pools * Richer internal data structures 0.15.0 [2018.09.05] ------------------- * Generalize code generators using grammar records * Add Python compatibility * Replace unit tests with golden tests * Use docopt and USAGE template for argument handling * Report number of arguments in nexus usage statements ================================================ FILE: LICENSE ================================================ Apache License Version 2.0, January 2004 http://www.apache.org/licenses/ TERMS AND CONDITIONS FOR USE, REPRODUCTION, AND DISTRIBUTION 1. Definitions. "License" shall mean the terms and conditions for use, reproduction, and distribution as defined by Sections 1 through 9 of this document. "Licensor" shall mean the copyright owner or entity authorized by the copyright owner that is granting the License. 
"Legal Entity" shall mean the union of the acting entity and all other entities that control, are controlled by, or are under common control with that entity. For the purposes of this definition, "control" means (i) the power, direct or indirect, to cause the direction or management of such entity, whether by contract or otherwise, or (ii) ownership of fifty percent (50%) or more of the outstanding shares, or (iii) beneficial ownership of such entity. "You" (or "Your") shall mean an individual or Legal Entity exercising permissions granted by this License. "Source" form shall mean the preferred form for making modifications, including but not limited to software source code, documentation source, and configuration files. "Object" form shall mean any form resulting from mechanical transformation or translation of a Source form, including but not limited to compiled object code, generated documentation, and conversions to other media types. "Work" shall mean the work of authorship, whether in Source or Object form, made available under the License, as indicated by a copyright notice that is included in or attached to the work (an example is provided in the Appendix below). "Derivative Works" shall mean any work, whether in Source or Object form, that is based on (or derived from) the Work and for which the editorial revisions, annotations, elaborations, or other modifications represent, as a whole, an original work of authorship. For the purposes of this License, Derivative Works shall not include works that remain separable from, or merely link (or bind by name) to the interfaces of, the Work and Derivative Works thereof. 
"Contribution" shall mean any work of authorship, including the original version of the Work and any modifications or additions to that Work or Derivative Works thereof, that is intentionally submitted to Licensor for inclusion in the Work by the copyright owner or by an individual or Legal Entity authorized to submit on behalf of the copyright owner. For the purposes of this definition, "submitted" means any form of electronic, verbal, or written communication sent to the Licensor or its representatives, including but not limited to communication on electronic mailing lists, source code control systems, and issue tracking systems that are managed by, or on behalf of, the Licensor for the purpose of discussing and improving the Work, but excluding communication that is conspicuously marked or otherwise designated in writing by the copyright owner as "Not a Contribution." "Contributor" shall mean Licensor and any individual or Legal Entity on behalf of whom a Contribution has been received by Licensor and subsequently incorporated within the Work. 2. Grant of Copyright License. Subject to the terms and conditions of this License, each Contributor hereby grants to You a perpetual, worldwide, non-exclusive, no-charge, royalty-free, irrevocable copyright license to reproduce, prepare Derivative Works of, publicly display, publicly perform, sublicense, and distribute the Work and such Derivative Works in Source or Object form. 3. Grant of Patent License. 
Subject to the terms and conditions of this License, each Contributor hereby grants to You a perpetual, worldwide, non-exclusive, no-charge, royalty-free, irrevocable (except as stated in this section) patent license to make, have made, use, offer to sell, sell, import, and otherwise transfer the Work, where such license applies only to those patent claims licensable by such Contributor that are necessarily infringed by their Contribution(s) alone or by combination of their Contribution(s) with the Work to which such Contribution(s) was submitted. If You institute patent litigation against any entity (including a cross-claim or counterclaim in a lawsuit) alleging that the Work or a Contribution incorporated within the Work constitutes direct or contributory patent infringement, then any patent licenses granted to You under this License for that Work shall terminate as of the date such litigation is filed. 4. Redistribution. You may reproduce and distribute copies of the Work or Derivative Works thereof in any medium, with or without modifications, and in Source or Object form, provided that You meet the following conditions: (a) You must give any other recipients of the Work or Derivative Works a copy of this License; and (b) You must cause any modified files to carry prominent notices stating that You changed the files; and (c) You must retain, in the Source form of any Derivative Works that You distribute, all copyright, patent, trademark, and attribution notices from the Source form of the Work, excluding those notices that do not pertain to any part of the Derivative Works; and (d) If the Work includes a "NOTICE" text file as part of its distribution, then any Derivative Works that You distribute must include a readable copy of the attribution notices contained within such NOTICE file, excluding those notices that do not pertain to any part of the Derivative Works, in at least one of the following places: within a NOTICE text file distributed as part of the 
Derivative Works; within the Source form or documentation, if provided along with the Derivative Works; or, within a display generated by the Derivative Works, if and wherever such third-party notices normally appear. The contents of the NOTICE file are for informational purposes only and do not modify the License. You may add Your own attribution notices within Derivative Works that You distribute, alongside or as an addendum to the NOTICE text from the Work, provided that such additional attribution notices cannot be construed as modifying the License. You may add Your own copyright statement to Your modifications and may provide additional or different license terms and conditions for use, reproduction, or distribution of Your modifications, or for any such Derivative Works as a whole, provided Your use, reproduction, and distribution of the Work otherwise complies with the conditions stated in this License. 5. Submission of Contributions. Unless You explicitly state otherwise, any Contribution intentionally submitted for inclusion in the Work by You to the Licensor shall be under the terms and conditions of this License, without any additional terms or conditions. Notwithstanding the above, nothing herein shall supersede or modify the terms of any separate license agreement you may have executed with Licensor regarding such Contributions. 6. Trademarks. This License does not grant permission to use the trade names, trademarks, service marks, or product names of the Licensor, except as required for reasonable and customary use in describing the origin of the Work and reproducing the content of the NOTICE file. 7. Disclaimer of Warranty. 
Unless required by applicable law or agreed to in writing, Licensor provides the Work (and each Contributor provides its Contributions) on an "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied, including, without limitation, any warranties or conditions of TITLE, NON-INFRINGEMENT, MERCHANTABILITY, or FITNESS FOR A PARTICULAR PURPOSE. You are solely responsible for determining the appropriateness of using or redistributing the Work and assume any risks associated with Your exercise of permissions under this License. 8. Limitation of Liability. In no event and under no legal theory, whether in tort (including negligence), contract, or otherwise, unless required by applicable law (such as deliberate and grossly negligent acts) or agreed to in writing, shall any Contributor be liable to You for damages, including any direct, indirect, special, incidental, or consequential damages of any character arising as a result of this License or out of the use or inability to use the Work (including but not limited to damages for loss of goodwill, work stoppage, computer failure or malfunction, or any and all other commercial damages or losses), even if such Contributor has been advised of the possibility of such damages. 9. Accepting Warranty or Additional Liability. While redistributing the Work or Derivative Works thereof, You may choose to offer, and charge a fee for, acceptance of support, warranty, indemnity, or other liability obligations and/or rights consistent with this License. However, in accepting such obligations, You may act only on Your own behalf and on Your sole responsibility, not on behalf of any other Contributor, and only if You agree to indemnify, defend, and hold each Contributor harmless for any liability incurred by, or claims asserted against, such Contributor by reason of your accepting any such warranty or additional liability. END OF TERMS AND CONDITIONS APPENDIX: How to apply the Apache License to your work. 
To apply the Apache License to your work, attach the following boilerplate notice, with the fields enclosed by brackets "[]" replaced with your own identifying information. (Don't include the brackets!) The text should be enclosed in the appropriate comment syntax for the file format. We also recommend that a file or class name and description of purpose be included on the same "printed page" as the copyright notice for easier identification within third-party archives. Copyright [yyyy] [name of copyright owner] Licensed under the Apache License, Version 2.0 (the "License"); you may not use this file except in compliance with the License. You may obtain a copy of the License at http://www.apache.org/licenses/LICENSE-2.0 Unless required by applicable law or agreed to in writing, software distributed under the License is distributed on an "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. See the License for the specific language governing permissions and limitations under the License. ================================================ FILE: README.md ================================================

build status github release license: Apache 2.0

Manual | Discord | Paper | X | BlueSky | Email

Morloc

compose functions across languages under a common type system

**Why use Morloc?** * Universal function composition: Import functions from multiple languages and compose them together under a unified, strongly-typed functional framework. * Polyglot without boilerplate: Use the best language for each task with no manual bindings or interop code. * Type-directed CLI generation: Write concrete function signatures once and automatically generate elegant command-line interfaces with argument parsing, validation, help text, and documentation. * Composable CLI tools: Morloc CLI programs can be composed by simply importing them into a new Morloc module and re-exporting their functions. * Seamless benchmarking and testing: Swap implementations and run the same benchmarks/tests across languages with consistent type signatures and data representation. * Design universal libraries: Build abstract, type-driven libraries and populate them with foreign language implementations, enabling rigorous code organization and reuse. * Smarter workflows: Replace brittle application/file-based pipelines with faster, more maintainable pipelines made from functions acting on structured data. Below is a simple example, for installation details and more examples, see the [Manual](https://morloc-project.github.io/docs). A Morloc module can import functions from foreign languages, assign them general types, and compose new functions: ```morloc -- Morloc code, in "main.loc" module m (vsum) import root-py import root-cpp source Py from "foo.py" ("pmap") pmap a b :: (a -> b) -> [a] -> [b] source Cpp from "foo.hpp" ("sum") sum :: [Real] -> Real --' Input numeric vectors that will be summed in parallel --' metavar: VECTORS type Vectors = [[Real]] --' Sum a list of numeric vectors --' return: Final sum of all elements in all vectors vsum :: Vectors -> Real vsum = sum . pmap sum ``` The imported code is natural code with no Morloc-specific dependencies. 
Below is the C++ code that defines `sum` as a function of a standard C++ vector of `double`s that returns a `double`: ```C++ // C++ code, in "foo.hpp" #pragma once #include #include double sum(std::vector xs) { return std::accumulate( xs.begin(), xs.end(), 0.0); } ``` Below is Python code that defines a parallel map function: ```python # Python code, in "foo.py" import multiprocessing as mp # Parallel map function def pmap(f, xs): with mp.Pool() as pool: results = pool.map(f, xs) return results ``` This program can be compiled and run as below: ``` $ menv morloc make main.loc $ menv ./nexus vsum -h Usage: ./nexus vsum VECTORS Sum a list of numeric vectors Positional arguments: VECTORS Input numeric vectors that will be summed in parallel type: [[Real]] Return: Real Final sum of all elements in all vectors $ menv ./nexus vsum [[1.2],[0,0.1]] 1.3 ``` ================================================ FILE: bench/Bench.hs ================================================ {-| Module : Bench Description : Benchmark suite for morloc compiler Copyright : (c) Zebulun Arendsee, 2016-2026 License : Apache-2.0 Maintainer : z@morloc.io This benchmark suite tracks performance of key compiler components: - Parser: parsing .loc source files - Type checker: type inference and checking - Code generator: nexus and pool generation Run with: stack bench Run with options: stack bench --benchmark-arguments '--csv bench-results.csv' -} module Main (main) where import Test.Tasty.Bench import qualified Data.Text as T import System.FilePath (()) import qualified System.Directory as SD import Morloc (typecheckFrontend, typecheck) import Morloc.Namespace.Prim (Code(..), Defaultable(..)) import Morloc.Namespace.State (Config(..), MorlocMonad, MorlocError) import qualified Morloc.Monad as MM -- | Helper to read benchmark test files readTestFile :: FilePath -> IO Code readTestFile name = do let path = "bench" "test-data" name Code . 
T.pack <$> readFile path -- | Create a minimal config for benchmarking emptyConfig :: IO Config emptyConfig = do home <- SD.getHomeDirectory return $ Config { configHome = home <> "/.local/share/morloc" , configLibrary = home <> "/.local/share/src/morloc" , configPlane = "default" , configPlaneCore = "morloclib" , configTmpDir = home <> "/.morloc/tmp" , configBuildConfig = home <> "/.morloc/.build-config.yaml" , configLangOverrides = mempty } -- | Run a MorlocMonad action for benchmarking runBench :: MorlocMonad a -> IO (Either MorlocError a) runBench action = do config <- emptyConfig ((result, _), _) <- MM.runMorlocMonad Nothing 0 config defaultValue action return result main :: IO () main = defaultMain [ bgroup "Parser" [ bench "parse-simple" $ whnfIO $ do code <- readTestFile "simple.loc" runBench (typecheckFrontend Nothing code) , bench "parse-interop" $ whnfIO $ do code <- readTestFile "interop.loc" runBench (typecheckFrontend Nothing code) , bench "parse-complex-types" $ whnfIO $ do code <- readTestFile "complex-types.loc" runBench (typecheckFrontend Nothing code) ] , bgroup "Type Checker" [ bench "typecheck-simple" $ whnfIO $ do code <- readTestFile "simple.loc" runBench (typecheck Nothing code) , bench "typecheck-interop" $ whnfIO $ do code <- readTestFile "interop.loc" runBench (typecheck Nothing code) , bench "typecheck-complex-types" $ whnfIO $ do code <- readTestFile "complex-types.loc" runBench (typecheck Nothing code) ] -- Note: Code generation benchmarks commented out as they require -- file system access and module initialization -- Uncomment after setting up appropriate test environment {- , bgroup "Code Generation" [ bench "generate-simple" $ whnfIO $ do code <- readTestFile "simple.loc" runBench (writeProgram Nothing code) ] -} ] ================================================ FILE: bench/test-data/complex-types.loc ================================================ module complex (processRecords) type Record = {id :: Int, name :: Str, values :: 
[Real]} processRecords :: [Record] -> [Int] processRecords rs = map (\r -> r.id) rs ================================================ FILE: bench/test-data/interop.loc ================================================ module interop (processList) import math (sqrt from python) processList :: [Real] -> [Real] processList xs = map sqrt xs ================================================ FILE: bench/test-data/simple.loc ================================================ module simple (add, mul) add :: Int -> Int -> Int add x y = x + y mul :: Int -> Int -> Int mul x y = x * y ================================================ FILE: container/Makefile ================================================ # Pushing to the github registry requires a personal token with package # permissions. Login is required, for example: # # $ echo $GITHUB_TOKEN | podman login ghcr.io -u morloc-project --password-stdin # # I am currently using the "classic" token (ghp_*), not the fine-grained # token. These need to be refreshed every few months # # You need to provide the desired morloc version as an environmental variable, # so run the make commands like so: # # $ make MORLOC_VERSION=0.70.0 build-tiny define HEREDOC #!/bin/bash mkdir -p ~/.morloc podman run --rm \ -e HOME=$$HOME \ -v $$HOME/.morloc:$$HOME/.morloc \ -v $$PWD:$$HOME \ -w $$HOME ghcr.io/morloc-project/morloc/morloc-tiny:edge \ morloc "$$@" endef export HEREDOC install: # Pull the exact version to ensure it exists locally podman pull ghcr.io/morloc-project/morloc/morloc-tiny:edge @mkdir -p ${HOME}/bin @echo "$$HEREDOC" > ${HOME}/bin/morloc-edge chmod 755 ${HOME}/bin/morloc-edge # Build a container that just has the morloc compiler. # Context is the repo root (..) so COPY gets the local source tree. build-tiny: podman build --no-cache --force-rm \ -t ghcr.io/morloc-project/morloc/morloc-tiny:$(MORLOC_VERSION) \ -t ghcr.io/morloc-project/morloc/morloc-tiny:edge \ -f tiny/Dockerfile .. # Build the full interactive development image. 
# Copies the morloc binary from the locally-built morloc-tiny image. # Run build-tiny first. build-full: podman build --no-cache --force-rm \ --build-arg MORLOC_VERSION=$(MORLOC_VERSION) \ -t ghcr.io/morloc-project/morloc/morloc-full:$(MORLOC_VERSION) \ -t ghcr.io/morloc-project/morloc/morloc-full:edge \ full # Build the required docker image build-test: podman build --no-cache --force-rm -t ghcr.io/morloc-project/morloc/morloc-test test podman tag ghcr.io/morloc-project/morloc/morloc-test ghcr.io/morloc-project/morloc/morloc-test:edge shell: podman run --shm-size=4g --rm -it ghcr.io/morloc-project/morloc/morloc-full:edge /bin/bash shell-tiny: podman run --shm-size=4g --rm -it ghcr.io/morloc-project/morloc/morloc-tiny:edge /bin/bash shell-test: podman run --shm-size=4g --rm -it ghcr.io/morloc-project/morloc/morloc-test /bin/bash # push local containers to the github registry # Ensures edge moves to the same digest as $(MORLOC_VERSION) push: # Push tiny version and edge podman push ghcr.io/morloc-project/morloc/morloc-tiny:$(MORLOC_VERSION) podman push ghcr.io/morloc-project/morloc/morloc-tiny:edge # Push full version and edge podman push ghcr.io/morloc-project/morloc/morloc-full:$(MORLOC_VERSION) podman push ghcr.io/morloc-project/morloc/morloc-full:edge # Push test (no moving tag) podman push ghcr.io/morloc-project/morloc/morloc-test:edge # retrieve the latest morloc builds from the github registry pull: podman pull ghcr.io/morloc-project/morloc/morloc-tiny:$(MORLOC_VERSION) podman pull ghcr.io/morloc-project/morloc/morloc-full:$(MORLOC_VERSION) podman pull ghcr.io/morloc-project/morloc/morloc-test podman pull ghcr.io/morloc-project/morloc/morloc-test:edge # Convenience: pull moving edge tags pull-edge: podman pull ghcr.io/morloc-project/morloc/morloc-tiny:edge podman pull ghcr.io/morloc-project/morloc/morloc-full:edge # Cleanup of podman images may be done as follows # $ podman image prune # $ podman container prune # $ podman image rm -f $(podman image ls -q) 
================================================ FILE: container/full/Dockerfile ================================================ # Copy the morloc binary from the matching tiny image ARG MORLOC_VERSION=edge FROM ghcr.io/morloc-project/morloc/morloc-tiny:${MORLOC_VERSION} AS morloc-bin FROM docker.io/library/ubuntu:24.04 LABEL org.opencontainers.image.source=https://github.com/morloc-project/morloc LABEL org.opencontainers.image.description="A morloc container intended for interactive shell use" LABEL org.opencontainers.image.licenses=Apache-2.0 COPY --from=morloc-bin /bin/morloc /bin/morloc COPY --from=morloc-bin /opt/morloc-rust-bin /opt/morloc-rust-bin WORKDIR $HOME ENV DEBIAN_FRONTEND=noninteractive ENV PATH="/root/.local/bin:/root/.local/share/morloc/bin:${PATH}" # Pre-built Rust binaries: morloc init uses these directly (no cargo needed) ENV MORLOC_RUST_BIN=/opt/morloc-rust-bin RUN apt-get update # Set the timezone, this avoids hanging later on RUN TZ=Antarctica/Troll apt-get -y install tzdata RUN apt-get install -y r-base python3 python3-dev python3-pip python3-numpy libgsl-dev git curl RUN python3 -m pip install --break-system-packages --upgrade setuptools # Setup the morloc home (uses pre-built Rust binaries, no cargo needed) RUN morloc init # Copy morloc-nexus to a system path so it remains on PATH even when # morloc-manager bind-mounts over ~/.local/bin with a host directory RUN cp /root/.local/share/morloc/bin/morloc-nexus /usr/local/bin/morloc-nexus RUN echo "lang_python3 : python3" >> $HOME/.local/share/morloc/config RUN morloc install stdlib RUN apt-get install -y vim # Copy over custom vimrc COPY assets/vimrc /root/.vimrc COPY assets/README /root/README # Set up vim highlighting for morloc RUN git clone https://github.com/morloc-project/vimmorloc \ && mkdir -p ~/.vim/syntax/ \ && mkdir -p ~/.vim/ftdetect/ \ && cp vimmorloc/loc.vim ~/.vim/syntax/ \ && echo 'au BufRead,BufNewFile *.loc set filetype=loc' > ~/.vim/ftdetect/loc.vim \ && rm -rf vimmorloc 
RUN git clone https://github.com/morloc-project/morloc ~/morloc COPY assets/bashrc /etc/bash.bashrc # Cleanup to reduce image size RUN apt-get clean && rm -rf /var/lib/apt/lists/* ================================================ FILE: container/full/assets/README ================================================ This container has a full morloc installation and language support for R, Python3, and C++. The ~/tests folder contains a set of tests from the morloc test suite. These may serve as simplistic examples of morloc scripts. Though they are designed for testing the language not pedagogy. ================================================ FILE: container/full/assets/bashrc ================================================ # basic morloc bashrc # If not running interactively, don't do anything case $- in *i*) ;; *) return;; esac # History Configuration HISTCONTROL=ignoreboth:erasedups HISTSIZE=10000 HISTFILESIZE=20000 shopt -s histappend # Shell Options shopt -s checkwinsize shopt -s globstar 2>/dev/null # Colors if [ -x /usr/bin/dircolors ]; then test -r ~/.dircolors && eval "$(dircolors -b ~/.dircolors)" || eval "$(dircolors -b)" fi # Prompt # Detect if we have color support if [ -x /usr/bin/tput ] && tput setaf 1 >&/dev/null; then # Define colors RESET='\[\033[0m\]' BOLD='\[\033[1m\]' DIM='\[\033[2m\]' # Color palette BLUE='\[\033[38;5;75m\]' GREEN='\[\033[38;5;114m\]' YELLOW='\[\033[38;5;221m\]' GRAY='\[\033[38;5;245m\]' RED='\[\033[38;5;204m\]' DEVNAME="" if [ ! -z "$MORLOC_ENV_NAME" ]; then DEVNAME="${DIM}${GRAY}(${MORLOC_ENV_NAME})${RESET} " fi MORLOC_VERSION=$(morloc --version) if [ $? 
-eq 0 ]; then MORLOC_VERSION="-${MORLOC_VERSION}" fi # Format: (container) morloc $ PS1="${DEVNAME}${YELLOW}morloc${MORLOC_VERSION}${RESET} $ " else # Fallback for no color PS1="morloc $ " fi # aliases alias ls='ls --color=auto' alias ll='ls -lh' alias la='ls -lah' alias l='ls -CF' # coloring alias grep='grep --color=auto' alias fgrep='fgrep --color=auto' alias egrep='egrep --color=auto' # fast navigation alias ..='cd ..' alias ...='cd ../..' alias ....='cd ../../..' alias .....='cd ../../../..' # setup path [ -d "$HOME/.local/bin" ] && PATH="$HOME/.local/bin:$PATH" [ -d "$HOME/bin" ] && PATH="$HOME/bin:$PATH" # completions if ! shopt -oq posix; then if [ -f /usr/share/bash-completion/bash_completion ]; then . /usr/share/bash-completion/bash_completion elif [ -f /etc/bash_completion ]; then . /etc/bash_completion fi fi ================================================ FILE: container/full/assets/vimrc ================================================ " Jump to the last position when reopening a file au BufReadPost * if line("'\"") > 1 && line("'\"") <= line("$") | exe "normal! g'\"" | endif " Load indentation rules and plugins according to the detected filetype. filetype plugin indent on syntax on set showcmd " Show (partial) command in status line. set showmatch " Show matching brackets. set ignorecase " Do case insensitive matching set smartcase " Do smart case matching set incsearch " Incremental search set autowrite " Automatically save before commands like :next and :make set hidden " Hide buffers when they are abandoned " An OK colorscheme colorscheme torte ================================================ FILE: container/static-build/Dockerfile ================================================ # Portable build of libmorloc.so, morloc-nexus, and morloc-manager. 
# # Strategy: # - libmorloc.so: shared library built on Ubuntu 20.04 (glibc >= 2.31) # - morloc-nexus: dynamically linked to libmorloc.so (glibc >= 2.31) # - morloc-manager: fully static binary (Alpine/musl, runs on any Linux) # # Build: # docker build -t morloc-rust-build -f container/static-build/Dockerfile . # docker run --rm -v $(pwd)/out:/out morloc-rust-build # # Output: # ./out/libmorloc.so (shared library, glibc >= 2.31) # ./out/morloc-nexus (binary, glibc >= 2.31, links libmorloc.so) # ./out/morloc-manager (static binary, runs on any Linux including NixOS) # =========================================================================== # Stage 1: Build libmorloc.so + morloc-nexus on Ubuntu (glibc) # # morloc-nexus dynamically links libmorloc.so at runtime, so both must be # built against the same libc. Ubuntu 20.04 gives glibc 2.31 forward compat. # =========================================================================== FROM docker.io/library/ubuntu:20.04 AS glibc-builder ENV DEBIAN_FRONTEND=noninteractive RUN apt-get update && apt-get install -y --no-install-recommends \ curl ca-certificates gcc g++ make pkg-config \ && rm -rf /var/lib/apt/lists/* RUN curl --proto '=https' --tlsv1.2 -sSf https://sh.rustup.rs | sh -s -- -y --default-toolchain stable \ && /root/.cargo/bin/cargo --version ENV PATH="/root/.cargo/bin:${PATH}" WORKDIR /build # Copy Cargo manifests first for dependency caching COPY data/rust/Cargo.toml data/rust/Cargo.lock ./ COPY data/rust/morloc-runtime/Cargo.toml ./morloc-runtime/ COPY data/rust/morloc-nexus/Cargo.toml ./morloc-nexus/ COPY data/rust/morloc-manager/Cargo.toml ./morloc-manager/ # Create dummy source files for dependency pre-build RUN mkdir -p morloc-runtime/src morloc-nexus/src morloc-manager/src \ && echo "fn main() {}" > morloc-nexus/src/main.rs \ && echo "fn main() {}" > morloc-manager/src/main.rs \ && echo "" > morloc-runtime/src/lib.rs RUN cargo build --release -p morloc-runtime 2>/dev/null || true # Copy actual source 
COPY data/rust/ ./ # Force rebuild after copying real source over dummy stubs RUN touch morloc-runtime/src/lib.rs morloc-nexus/src/main.rs # Build libmorloc.so from staticlib via gcc --whole-archive to export ALL # symbols (internal Rust runtime state must be visible to language extensions) RUN cargo build --release -p morloc-runtime RUN mkdir -p /root/.local/share/morloc/lib \ && gcc -shared -o /root/.local/share/morloc/lib/libmorloc.so \ -Wl,--whole-archive target/release/libmorloc_runtime.a -Wl,--no-whole-archive \ -lpthread -lrt -ldl -lm # Build morloc-nexus (dynamically links libmorloc.so) RUN cargo build --release -p morloc-nexus RUN strip /root/.local/share/morloc/lib/libmorloc.so target/release/morloc-nexus # =========================================================================== # Stage 2: Build morloc-manager on Alpine (musl, fully static) # # morloc-manager has no native dependencies — pure Rust crates only. # Building on Alpine produces a fully static musl binary that runs on any # Linux, including NixOS and minimal containers. 
# =========================================================================== FROM docker.io/library/alpine:3.20 AS musl-builder RUN apk add --no-cache curl gcc musl-dev RUN curl --proto '=https' --tlsv1.2 -sSf https://sh.rustup.rs | sh -s -- -y --default-toolchain stable \ && /root/.cargo/bin/cargo --version ENV PATH="/root/.cargo/bin:${PATH}" WORKDIR /build # Copy Cargo manifests for dependency caching COPY data/rust/Cargo.toml data/rust/Cargo.lock ./ COPY data/rust/morloc-runtime/Cargo.toml ./morloc-runtime/ COPY data/rust/morloc-nexus/Cargo.toml ./morloc-nexus/ COPY data/rust/morloc-manager/Cargo.toml ./morloc-manager/ RUN mkdir -p morloc-runtime/src morloc-nexus/src morloc-manager/src \ && echo "fn main() {}" > morloc-nexus/src/main.rs \ && echo "fn main() {}" > morloc-manager/src/main.rs \ && echo "" > morloc-runtime/src/lib.rs RUN cargo build --release -p morloc-manager 2>/dev/null || true COPY data/rust/ ./ # Force rebuild: cargo may skip if it thinks the cached dummy binary is fresh RUN touch morloc-manager/src/main.rs \ && cargo build --release -p morloc-manager RUN strip target/release/morloc-manager # =========================================================================== # Stage 3: Verify and output # =========================================================================== FROM docker.io/library/alpine:3.20 RUN apk add --no-cache file COPY --from=glibc-builder /root/.local/share/morloc/lib/libmorloc.so /out-staging/libmorloc.so COPY --from=glibc-builder /build/target/release/morloc-nexus /out-staging/morloc-nexus COPY --from=musl-builder /build/target/release/morloc-manager /out-staging/morloc-manager # Verify morloc-manager is static (no dynamic linker needed) RUN file /out-staging/morloc-manager \ && ! 
ldd /out-staging/morloc-manager 2>&1 | grep -q "=>" \ && echo "OK: morloc-manager has no dynamic dependencies" CMD ["sh", "-c", "cp /out-staging/libmorloc.so /out-staging/morloc-nexus /out-staging/morloc-manager /out/ && echo 'Wrote libmorloc.so, morloc-nexus, morloc-manager' && ls -lh /out/libmorloc.so /out/morloc-nexus /out/morloc-manager && echo && file /out/morloc-manager"] ================================================ FILE: container/static-build/build.sh ================================================ #!/bin/sh # Build portable libmorloc.so, morloc-nexus, and morloc-manager. # # Usage: # ./container/static-build/build.sh # # Output: # ./out/libmorloc.so (shared library, glibc >= 2.31) # ./out/morloc-nexus (binary, glibc >= 2.31, links libmorloc.so) # ./out/morloc-manager (static binary, runs on any Linux) set -e SCRIPT_DIR="$(cd "$(dirname "$0")" && pwd)" PROJECT_DIR="$(cd "$SCRIPT_DIR/../.." && pwd)" # Detect container engine (prefer podman) if command -v podman >/dev/null 2>&1; then ENGINE=podman elif command -v docker >/dev/null 2>&1; then ENGINE=docker else echo "Error: neither podman nor docker found" >&2 exit 1 fi echo "Building libmorloc.so, morloc-nexus, and morloc-manager with $ENGINE..." 
mkdir -p "$PROJECT_DIR/out" $ENGINE build \ -t morloc-rust-build \ -f "$SCRIPT_DIR/Dockerfile" \ "$PROJECT_DIR" $ENGINE run --rm \ -v "$PROJECT_DIR/out:/out" \ morloc-rust-build echo "" echo "Binaries:" ls -lh "$PROJECT_DIR/out/libmorloc.so" "$PROJECT_DIR/out/morloc-nexus" "$PROJECT_DIR/out/morloc-manager" file "$PROJECT_DIR/out/libmorloc.so" "$PROJECT_DIR/out/morloc-nexus" "$PROJECT_DIR/out/morloc-manager" ================================================ FILE: container/test/Dockerfile ================================================ FROM docker.io/library/ubuntu:24.04 ENV DEBIAN_FRONTEND=noninteractive RUN apt-get update && apt-get install -y \ git \ gdb \ curl \ pkg-config \ libglib2.0-dev \ build-essential \ libffi-dev \ libgmp-dev \ zlib1g-dev # Install GHCup into /opt/ghcup (accessible to all users) ENV GHCUP_INSTALL_BASE_PREFIX=/opt ENV BOOTSTRAP_HASKELL_NONINTERACTIVE=1 RUN curl --proto '=https' --tlsv1.2 -sSf https://get-ghcup.haskell.org | sh # Add ghcup to PATH ENV PATH="/opt/.ghcup/bin:${PATH}" # Install Rust toolchain (needed by morloc init to build libmorloc.so) RUN curl --proto '=https' --tlsv1.2 -sSf https://sh.rustup.rs | sh -s -- -y ENV PATH="/root/.cargo/bin:${PATH}" # Set the timezone, this avoids hanging later on RUN TZ=Antarctica/Troll apt-get -y install tzdata # hyperfine is needed for shell benchmarks RUN apt-get install -y r-base python3 python3-dev python3-pip libgsl-dev git hyperfine RUN python3 -m pip install --break-system-packages --upgrade setuptools numpy pyarrow # Set up R environment # stringi is needed for benchmarks RUN Rscript -e 'install.packages("stringi", repos = "https://cloud.r-project.org")' # Install R Arrow package for cross-language Arrow IPC support ENV LIBARROW_MINIMAL=true ENV ARROW_S3=OFF ENV ARROW_GCS=OFF RUN Rscript -e 'install.packages("arrow", repos = "https://cloud.r-project.org")' # Cleanup to reduce image size RUN apt-get clean && rm -rf /var/lib/apt/lists/* # Create /home/dev with permissive access so any 
--user UID:GID can write here. # morloc-manager bind-mounts .stack and .local into this directory. RUN mkdir -p /home/dev && chmod 1777 /home/dev COPY assets/bashrc /etc/bash.bashrc ================================================ FILE: container/test/assets/bashrc ================================================ # basic morloc bashrc # If not running interactively, don't do anything case $- in *i*) ;; *) return;; esac # History Configuration HISTCONTROL=ignoreboth:erasedups HISTSIZE=10000 HISTFILESIZE=20000 shopt -s histappend # Shell Options shopt -s checkwinsize shopt -s globstar 2>/dev/null # Colors if [ -x /usr/bin/dircolors ]; then test -r ~/.dircolors && eval "$(dircolors -b ~/.dircolors)" || eval "$(dircolors -b)" fi # Prompt # Detect if we have color support if [ -x /usr/bin/tput ] && tput setaf 1 >&/dev/null; then # Define colors RESET='\[\033[0m\]' BOLD='\[\033[1m\]' DIM='\[\033[2m\]' # Color palette BLUE='\[\033[38;5;75m\]' GREEN='\[\033[38;5;114m\]' YELLOW='\[\033[38;5;221m\]' GRAY='\[\033[38;5;245m\]' RED='\[\033[38;5;204m\]' DEVNAME="" if [ ! -z "$MORLOC_ENV_NAME" ]; then DEVNAME="${DIM}${GRAY}(${MORLOC_ENV_NAME})${RESET} " fi # Format: (container) morloc $ PS1="${DEVNAME}${YELLOW}morloc-dev${RESET} $ " else # Fallback for no color PS1="morloc-dev $ " fi # aliases alias ls='ls --color=auto' alias ll='ls -lh' alias la='ls -lah' alias l='ls -CF' # coloring alias grep='grep --color=auto' alias fgrep='fgrep --color=auto' alias egrep='egrep --color=auto' # fast navigation alias ..='cd ..' alias ...='cd ../..' alias ....='cd ../../..' alias .....='cd ../../../..' # setup path [ -d "$HOME/.local/bin" ] && PATH="$HOME/.local/bin:$PATH" [ -d "$HOME/bin" ] && PATH="$HOME/bin:$PATH" # completions if ! shopt -oq posix; then if [ -f /usr/share/bash-completion/bash_completion ]; then . /usr/share/bash-completion/bash_completion elif [ -f /etc/bash_completion ]; then . 
/etc/bash_completion fi fi ================================================ FILE: container/tiny/Dockerfile ================================================ ############################################################################### # Stage 1: Build the morloc compiler from local source FROM docker.io/library/ubuntu:24.04 AS morloc-build ENV DEBIAN_FRONTEND=noninteractive RUN apt-get update && apt-get install -y git curl pkg-config libglib2.0-dev # Install stack RUN curl -SL https://get.haskellstack.org/ | sh # Copy the local source tree (no git clone -- builds exactly this checkout) COPY . /morloc # Build morloc RUN cd /morloc && stack install --no-run-tests ############################################################################### # Stage 2: Build Rust binaries (libmorloc.so + morloc-nexus + morloc-manager) FROM docker.io/library/ubuntu:24.04 AS rust-build ENV DEBIAN_FRONTEND=noninteractive RUN apt-get update && apt-get install -y --no-install-recommends \ curl ca-certificates gcc g++ make pkg-config \ && rm -rf /var/lib/apt/lists/* RUN curl --proto '=https' --tlsv1.2 -sSf https://sh.rustup.rs | sh -s -- -y --default-toolchain stable ENV PATH="/root/.cargo/bin:${PATH}" COPY data/rust/ /build/ WORKDIR /build # Build libmorloc.so from staticlib RUN cargo build --release -p morloc-runtime RUN gcc -shared -o libmorloc.so \ -Wl,--whole-archive target/release/libmorloc_runtime.a -Wl,--no-whole-archive \ -lpthread -lrt -ldl -lm # Install libmorloc.so where the nexus linker expects it RUN mkdir -p /root/.local/share/morloc/lib \ && cp libmorloc.so /root/.local/share/morloc/lib/ # Build morloc-nexus and morloc-manager RUN cargo build --release -p morloc-nexus RUN cargo build --release -p morloc-manager # Strip all RUN strip libmorloc.so target/release/morloc-nexus target/release/morloc-manager # Collect into a single directory RUN mkdir -p /rust-bin \ && cp libmorloc.so /rust-bin/ \ && cp target/release/morloc-nexus /rust-bin/ \ && cp 
target/release/morloc-manager /rust-bin/ ############################################################################### # Stage 3: Final minimal image with compiler + pre-built Rust binaries LABEL org.opencontainers.image.source=https://github.com/morloc-project/morloc LABEL org.opencontainers.image.description="Morloc executable in a minimal container" LABEL org.opencontainers.image.licenses=Apache-2.0 FROM docker.io/library/ubuntu:24.04 COPY --from=morloc-build /root/.local/bin/morloc /bin/morloc COPY --from=rust-build /rust-bin/ /opt/morloc-rust-bin/ # morloc make builds C++ pools, so g++ is needed RUN apt-get update && apt-get install -y --no-install-recommends g++ \ && apt-get clean && rm -rf /var/lib/apt/lists/* # Point morloc init at pre-built binaries (no cargo needed at runtime) ENV MORLOC_RUST_BIN=/opt/morloc-rust-bin ================================================ FILE: data/lang/c/lang.yaml ================================================ # C language metadata for morloc compiler name: c extension: c aliases: [] is_compiled: true run_command: [] serial_type: "" cost: 1 ================================================ FILE: data/lang/cpp/cppmorloc.cpp ================================================ #include #include #include #include "morloc.h" absptr_t cpp_rel2abs(relptr_t ptr){ char* errmsg = NULL; absptr_t absptr = rel2abs(ptr, &errmsg); if(errmsg != NULL){ std::string msg(errmsg); free(errmsg); throw std::runtime_error(msg); } return absptr; } relptr_t abs2rel_cpp(absptr_t ptr){ char* errmsg = NULL; relptr_t relptr = abs2rel(ptr, &errmsg); if(errmsg != NULL){ std::string msg(errmsg); free(errmsg); throw std::runtime_error(msg); } return relptr; } bool shfree_cpp(absptr_t ptr){ char* errmsg = NULL; bool success = shfree(ptr, &errmsg); if(errmsg != NULL){ std::string msg(errmsg); free(errmsg); throw std::runtime_error(msg); } return success; } Schema* parse_schema_cpp(const char* schema_ptr){ char* errmsg = NULL; Schema* schema = 
parse_schema(schema_ptr, &errmsg); if(errmsg != NULL){ std::string msg(errmsg); free(errmsg); throw std::runtime_error(msg); } return schema; } void* shmalloc_cpp(size_t size){ char* errmsg = NULL; void* new_ptr = shmalloc(size, &errmsg); if(errmsg != NULL){ std::string msg(errmsg); free(errmsg); throw std::runtime_error(msg); } return new_ptr; } shm_t* shinit_cpp(const char* shm_basename, size_t volume_index, size_t shm_size) { char* errmsg = NULL; shm_t* new_ptr = shinit(shm_basename, volume_index, shm_size, &errmsg); if(errmsg != NULL){ std::string msg(errmsg); free(errmsg); throw std::runtime_error(msg); } return new_ptr; } int pack_with_schema_cpp(const void* mlc, const Schema* schema, char** mpk, size_t* mpk_size){ char* errmsg = NULL; int exitcode = pack_with_schema(mlc, schema, mpk, mpk_size, &errmsg); if(errmsg != NULL){ std::string msg(errmsg); free(errmsg); throw std::runtime_error(msg); } return exitcode; } int unpack_with_schema_cpp(const char* mgk, size_t mgk_size, const Schema* schema, void** mlcptr){ char* errmsg = NULL; int exitcode = unpack_with_schema(mgk, mgk_size, schema, mlcptr, &errmsg); if(errmsg != NULL){ std::string msg(errmsg); free(errmsg); throw std::runtime_error(msg); } return exitcode; } ================================================ FILE: data/lang/cpp/cppmorloc.hpp ================================================ #ifndef __CPPMORLOC_HPP__ #define __CPPMORLOC_HPP__ #include #include #include #include #include #include #include #include #include #include #include #include #include #include "morloc.h" #include "mlc_tensor.hpp" // ============================================================ // Type traits for container dispatch // ============================================================ template struct is_std_vector : std::false_type {}; template struct is_std_vector> : std::true_type {}; template struct is_std_list : std::false_type {}; template struct is_std_list> : std::true_type {}; template struct is_std_forward_list : 
std::false_type {}; template struct is_std_forward_list> : std::true_type {}; template struct is_std_deque : std::false_type {}; template struct is_std_deque> : std::true_type {}; template struct is_std_stack : std::false_type {}; template struct is_std_stack> : std::true_type {}; template struct is_std_queue : std::false_type {}; template struct is_std_queue> : std::true_type {}; template struct is_std_tuple : std::false_type {}; template struct is_std_tuple> : std::true_type {}; template struct is_std_pair : std::false_type {}; template struct is_std_pair> : std::true_type {}; template struct is_std_optional : std::false_type {}; template struct is_std_optional> : std::true_type {}; template inline constexpr bool is_non_vector_container_v = is_std_list::value || is_std_forward_list::value || is_std_deque::value || is_std_stack::value || is_std_queue::value; // ============================================================ // Container-to-vector conversion // ============================================================ template auto to_vector(const Container& c) { using T = typename Container::value_type; if constexpr (is_std_stack::value) { std::vector v; auto copy = c; while (!copy.empty()) { v.push_back(copy.top()); copy.pop(); } std::reverse(v.begin(), v.end()); return v; } else if constexpr (is_std_queue::value) { std::vector v; auto copy = c; while (!copy.empty()) { v.push_back(copy.front()); copy.pop(); } return v; } else { return std::vector(c.begin(), c.end()); } } // ============================================================ // C runtime wrappers (implementations in cppmorloc.cpp) // ============================================================ absptr_t cpp_rel2abs(relptr_t ptr); relptr_t abs2rel_cpp(absptr_t ptr); // Resolve a relative pointer using either base-pointer arithmetic (inline data) // or SHM. When base_ptr is non-null, data lives in a contiguous malloc'd blob. 
static inline void* resolve_relptr_cpp(relptr_t relptr, const void* base_ptr) { if (base_ptr) { return (char*)base_ptr + relptr; } return cpp_rel2abs(relptr); } bool shfree_cpp(absptr_t ptr); Schema* parse_schema_cpp(const char* schema_ptr); void* shmalloc_cpp(size_t size); shm_t* shinit_cpp(const char* shm_basename, size_t volume_index, size_t shm_size); int pack_with_schema_cpp(const void* mlc, const Schema* schema, char** mpk, size_t* mpk_size); int unpack_with_schema_cpp(const char* mgk, size_t mgk_size, const Schema* schema, void** mlcptr); // ============================================================ // mpk_pack / mpk_unpack declarations // ============================================================ template std::vector mpk_pack(const T& data, const std::string& schema_str); template T mpk_unpack(const std::vector& packed_data, const std::string& schema_str); // ============================================================ // schema_alignment (C++ mirror of the C function in schema.c) // ============================================================ inline size_t schema_alignment_cpp(const Schema* schema) { switch (schema->type) { case MORLOC_NIL: case MORLOC_BOOL: case MORLOC_SINT8: case MORLOC_UINT8: return 1; case MORLOC_SINT16: case MORLOC_UINT16: return 2; case MORLOC_SINT32: case MORLOC_UINT32: case MORLOC_FLOAT32: return 4; case MORLOC_SINT64: case MORLOC_UINT64: case MORLOC_FLOAT64: case MORLOC_STRING: case MORLOC_ARRAY: case MORLOC_TENSOR: return alignof(size_t); case MORLOC_TUPLE: case MORLOC_MAP: { size_t max_align = 1; for (size_t i = 0; i < schema->size; i++) { size_t a = schema_alignment_cpp(schema->parameters[i]); if (a > max_align) max_align = a; } return max_align; } case MORLOC_OPTIONAL: return schema_alignment_cpp(schema->parameters[0]); default: return alignof(size_t); } } // ============================================================ // get_shm_size // ============================================================ // Forward declaration 
template size_t get_shm_size(const Schema* schema, const T& data); size_t get_shm_size(const Schema* schema, const std::nullptr_t&) { return sizeof(int8_t); } // Primitives template size_t get_shm_size(const Schema* schema, const Primitive& data) { return schema->width; } template size_t get_shm_size(const Schema* schema, const std::vector& data) { size_t total_size = schema->width; // worst-case cursor alignment padding for element data total_size += schema_alignment_cpp(schema->parameters[0]) - 1; switch(schema->parameters[0]->type){ case MORLOC_NIL: case MORLOC_BOOL: case MORLOC_SINT8: case MORLOC_SINT16: case MORLOC_SINT32: case MORLOC_SINT64: case MORLOC_UINT8: case MORLOC_UINT16: case MORLOC_UINT32: case MORLOC_UINT64: case MORLOC_FLOAT32: case MORLOC_FLOAT64: total_size += data.size() * schema->parameters[0]->width; break; case MORLOC_STRING: case MORLOC_ARRAY: case MORLOC_TUPLE: case MORLOC_MAP: case MORLOC_OPTIONAL: for(size_t i = 0; i < data.size(); i++){ total_size += get_shm_size(schema->parameters[0], data[i]); } break; } return total_size; } // Optional: tag byte + aligned inner value template size_t get_shm_size(const Schema* schema, const std::optional& data) { if (!data.has_value()) { return schema->width; } size_t inner_size = get_shm_size(schema->parameters[0], *data); size_t extra = (inner_size > schema->parameters[0]->width) ? 
inner_size - schema->parameters[0]->width : 0; return schema->width + extra; } size_t get_shm_size(const Schema* schema, const std::string& data) { return schema->width + data.size(); } size_t get_shm_size(void* dest, const Schema* schema, const char* data) { return schema->width + strlen(data); } template size_t createTupleShmSizeHelper(const Schema* schema, const Tuple& data, std::index_sequence) { size_t total_size = schema->width; (void)std::initializer_list{( [&](){ size_t elem = get_shm_size(schema->parameters[Is], std::get(data)); if (elem > schema->parameters[Is]->width) { total_size += elem - schema->parameters[Is]->width; } }(), 0 )...}; return total_size; } template size_t get_shm_size(const Schema* schema, const std::tuple& data) { return createTupleShmSizeHelper(schema, data, std::index_sequence_for{}); } // Non-vector containers: convert to vector and delegate template size_t get_shm_size(const Schema* schema, const std::list& data) { return get_shm_size(schema, to_vector(data)); } template size_t get_shm_size(const Schema* schema, const std::forward_list& data) { return get_shm_size(schema, to_vector(data)); } template size_t get_shm_size(const Schema* schema, const std::deque& data) { return get_shm_size(schema, to_vector(data)); } template size_t get_shm_size(const Schema* schema, const std::stack& data) { return get_shm_size(schema, to_vector(data)); } template size_t get_shm_size(const Schema* schema, const std::queue& data) { return get_shm_size(schema, to_vector(data)); } // Tensor: header + shape array + contiguous data template size_t get_shm_size(const Schema* schema, const mlc::Tensor& data) { using S = mlc::tensor_storage_t; size_t total = sizeof(Tensor); // alignment padding for shape array total += alignof(int64_t) - 1; total += NDim * sizeof(int64_t); // alignment padding for element data total += schema_alignment_cpp(schema->parameters[0]) - 1; total += data.size() * sizeof(S); return total; } // 
============================================================ // toAnything - top-level (allocating) // ============================================================ // Generic top-level: compute size, allocate, serialize template void* toAnything(const Schema* schema, const T& data){ size_t total_size = get_shm_size(schema, data); void* dest = shmalloc_cpp(total_size); void* cursor = (void*)((char*)dest + schema->width); try { return toAnything(dest, &cursor, schema, data); } catch (...) { shfree_cpp(dest); throw; } } // Non-vector containers: convert to vector and delegate template void* toAnything(const Schema* schema, const std::stack& data) { return toAnything(schema, to_vector(data)); } template void* toAnything(const Schema* schema, const std::forward_list& data) { return toAnything(schema, to_vector(data)); } template void* toAnything(const Schema* schema, const std::queue& data) { return toAnything(schema, to_vector(data)); } template void* toAnything(const Schema* schema, const std::deque& data) { return toAnything(schema, to_vector(data)); } template void* toAnything(const Schema* schema, const std::list& data) { return toAnything(schema, to_vector(data)); } // ============================================================ // toAnything - cursor-based (recursive) // ============================================================ // Forward declaration template void* toAnything(void* dest, void** cursor, const Schema* schema, const T& data); // Write raw binary data as an array void* binarytoAnything(void* dest, void** cursor, const Schema* schema, const uint8_t* data, size_t size) { Array* result = static_cast(dest); result->size = size; if(size == 0){ result->data = RELNULL; return dest; } absptr_t data_ptr = static_cast(*cursor); result->data = abs2rel_cpp(data_ptr); *cursor = static_cast(*cursor) + size * schema->parameters[0]->width; memcpy(data_ptr, data, size); return dest; } void* toAnything(void* dest, void** cursor, const Schema* schema, const 
std::nullptr_t&) { *((int8_t*)dest) = (int8_t)0; return dest; } // Primitives template void* toAnything(void* dest, void** cursor, const Schema* schema, const Primitive& data) { *((Primitive*)dest) = data; return dest; } // Vector (primary array implementation) template void* toAnything(void* dest, void** cursor, const Schema* schema, const std::vector& data) { Array* result = static_cast(dest); result->size = data.size(); if(data.size() == 0){ result->data = RELNULL; return dest; } // align cursor for element data placement *cursor = reinterpret_cast(ALIGN_UP(reinterpret_cast(*cursor), schema_alignment_cpp(schema->parameters[0]))); result->data = abs2rel_cpp(static_cast(*cursor)); *cursor = static_cast(*cursor) + data.size() * schema->parameters[0]->width; char* start = (char*)cpp_rel2abs(result->data); size_t width = schema->parameters[0]->width; for (size_t i = 0; i < data.size(); ++i) { toAnything(start + width * i, cursor, schema->parameters[0], data[i]); } return dest; } // Shared helper for iterable containers (list, forward_list, deque) template void* toAnything_seq(void* dest, void** cursor, const Schema* schema, const Container& data, size_t size) { Array* result = static_cast(dest); result->size = size; if(size == 0){ result->data = RELNULL; return dest; } // align cursor for element data placement *cursor = reinterpret_cast(ALIGN_UP(reinterpret_cast(*cursor), schema_alignment_cpp(schema->parameters[0]))); result->data = abs2rel_cpp(static_cast(*cursor)); *cursor = static_cast(*cursor) + size * schema->parameters[0]->width; char* start = (char*)cpp_rel2abs(result->data); size_t width = schema->parameters[0]->width; size_t i = 0; for (const auto& item : data) { toAnything(start + width * i, cursor, schema->parameters[0], item); ++i; } return dest; } template void* toAnything(void* dest, void** cursor, const Schema* schema, const std::list& data) { return toAnything_seq(dest, cursor, schema, data, data.size()); } template void* toAnything(void* dest, 
void** cursor, const Schema* schema, const std::forward_list& data) { return toAnything_seq(dest, cursor, schema, data, std::distance(data.begin(), data.end())); } template void* toAnything(void* dest, void** cursor, const Schema* schema, const std::deque& data) { return toAnything_seq(dest, cursor, schema, data, data.size()); } // Stack and queue: convert to vector and delegate template void* toAnything(void* dest, void** cursor, const Schema* schema, const std::queue& data) { return toAnything(dest, cursor, schema, to_vector(data)); } template void* toAnything(void* dest, void** cursor, const Schema* schema, const std::stack& data) { return toAnything(dest, cursor, schema, to_vector(data)); } // String and C string void* toAnything(void* dest, void** cursor, const Schema* schema, const std::string& data) { return binarytoAnything(dest, cursor, schema, (const uint8_t*)data.c_str(), data.size()); } void* toAnything(void* dest, void** cursor, const Schema* schema, const char* data) { return binarytoAnything(dest, cursor, schema, (const uint8_t*)data, strlen(data)); } // Tuple template void* createTupleAnythingHelper(void* dest, const Schema* schema, void** cursor, const Tuple& data, std::index_sequence) { (void)std::initializer_list{( toAnything((char*)dest + schema->offsets[Is], cursor, schema->parameters[Is], std::get(data)), 0 )...}; return dest; } template void* toAnything(void* dest, void** cursor, const Schema* schema, const std::tuple& data) { return createTupleAnythingHelper(dest, schema, cursor, data, std::index_sequence_for{}); } // Pair (reuses tuple helper since std::pair supports std::get) template void* toAnything(void* dest, void** cursor, const Schema* schema, const std::pair& data) { return createTupleAnythingHelper(dest, schema, cursor, data, std::index_sequence<0, 1>{}); } // Optional template void* toAnything(void* dest, void** cursor, const Schema* schema, const std::optional& data) { if (!data.has_value()) { *((uint8_t*)dest) = 0; 
memset((char*)dest + schema->offsets[0], 0, schema->parameters[0]->width); } else { *((uint8_t*)dest) = 1; toAnything((char*)dest + schema->offsets[0], cursor, schema->parameters[0], *data); } return dest; } // Tensor: write Tensor header + shape array + contiguous data template void* toAnything(void* dest, void** cursor, const Schema* schema, const mlc::Tensor& data) { Tensor* result = static_cast(dest); result->total_elements = data.size(); result->device_type = 0; result->device_id = 0; if (data.size() == 0) { result->shape = RELNULL; result->data = RELNULL; return dest; } // Write shape array *cursor = reinterpret_cast(ALIGN_UP(reinterpret_cast(*cursor), alignof(int64_t))); result->shape = abs2rel_cpp(static_cast(*cursor)); int64_t* shape_dst = (int64_t*)*cursor; for (int i = 0; i < NDim; i++) shape_dst[i] = data.shape()[i]; *cursor = (char*)*cursor + NDim * sizeof(int64_t); // Write data buffer (contiguous row-major) using S = mlc::tensor_storage_t; size_t elem_align = schema_alignment_cpp(schema->parameters[0]); *cursor = reinterpret_cast(ALIGN_UP(reinterpret_cast(*cursor), elem_align)); result->data = abs2rel_cpp(static_cast(*cursor)); size_t data_bytes = data.size() * sizeof(S); memcpy(*cursor, data.data(), data_bytes); *cursor = (char*)*cursor + data_bytes; return dest; } // ============================================================ // fromAnything - single template with if constexpr dispatch // ============================================================ // Forward declaration for recursive calls template T fromAnything(const Schema* schema, const void* data, T* = nullptr, const void* base_ptr = nullptr); // Tuple helper (needs forward declaration of fromAnything) template Tuple fromTupleAnythingHelper( const Schema* schema, const void* anything, std::index_sequence, Tuple* = nullptr, const void* base_ptr = nullptr ) { return Tuple(fromAnything(schema->parameters[Is], (char*)anything + schema->offsets[Is], static_cast*>(nullptr), base_ptr)...); } 
template T fromAnything(const Schema* schema, const void* data, T*, const void* base_ptr) { if(data == NULL){ throw std::runtime_error("Void error in fromAnything"); } if constexpr (std::is_same_v) { // NOTE: do NOT use bool here since its width is often not 1 byte return *(uint8_t*)data == 1; } else if constexpr (std::is_same_v) { Array* array = (Array*)data; if(array->size > 0){ return std::string((char*)resolve_relptr_cpp(array->data, base_ptr), array->size); } return std::string(""); } else if constexpr (is_std_vector::value) { using ElemT = typename T::value_type; std::vector result; Array* array = (Array*)data; if(array->size == 0) return result; // Fast path for primitive arrays switch(schema->parameters[0]->type){ case MORLOC_NIL: case MORLOC_BOOL: case MORLOC_SINT8: case MORLOC_SINT16: case MORLOC_SINT32: case MORLOC_SINT64: case MORLOC_UINT8: case MORLOC_UINT16: case MORLOC_UINT32: case MORLOC_UINT64: case MORLOC_FLOAT32: case MORLOC_FLOAT64: { ElemT* arr_start = (ElemT*)resolve_relptr_cpp(array->data, base_ptr); std::vector pv(arr_start, arr_start + array->size); return pv; } } // Complex element types result.reserve(array->size); const Schema* elem_schema = schema->parameters[0]; char* start = (char*)resolve_relptr_cpp(array->data, base_ptr); for(size_t i = 0; i < array->size; i++){ result.push_back(fromAnything(elem_schema, (void*)(start + i * elem_schema->width), static_cast(nullptr), base_ptr)); } return result; } else if constexpr (is_non_vector_container_v) { using ElemT = typename T::value_type; Array* array = (Array*)data; T result; if(array->size == 0) return result; const Schema* elem_schema = schema->parameters[0]; char* start = (char*)resolve_relptr_cpp(array->data, base_ptr); constexpr bool reverse = is_std_stack::value || is_std_forward_list::value; if constexpr (reverse) { for (size_t i = array->size; i > 0; --i) { auto elem = fromAnything(elem_schema, (void*)(start + (i-1) * elem_schema->width), static_cast(nullptr), base_ptr); if 
constexpr (is_std_stack::value) result.push(std::move(elem)); else result.push_front(std::move(elem)); } } else { for (size_t i = 0; i < array->size; ++i) { auto elem = fromAnything(elem_schema, (void*)(start + i * elem_schema->width), static_cast(nullptr), base_ptr); if constexpr (is_std_queue::value) result.push(std::move(elem)); else result.push_back(std::move(elem)); } } return result; } else if constexpr (is_std_tuple::value) { return fromTupleAnythingHelper( schema, data, std::make_index_sequence>{}, static_cast(nullptr), base_ptr ); } else if constexpr (is_std_pair::value) { return fromTupleAnythingHelper( schema, data, std::index_sequence<0, 1>{}, static_cast(nullptr), base_ptr ); } else if constexpr (is_std_optional::value) { using InnerT = typename T::value_type; uint8_t tag = *(const uint8_t*)data; if (tag == 0) { return std::nullopt; } return std::optional(fromAnything(schema->parameters[0], (const char*)data + schema->offsets[0], static_cast(nullptr), base_ptr)); } else if constexpr (mlc::is_mlc_tensor_v) { using ElemT = mlc::tensor_element_t; using StorageT = mlc::tensor_storage_t; constexpr int NDim = mlc::tensor_ndim_v; const Tensor* tensor = (const Tensor*)data; if (tensor->total_elements == 0) { int64_t zero_shape[NDim] = {}; return T(zero_shape); } const int64_t* shape = (const int64_t*)resolve_relptr_cpp(tensor->shape, base_ptr); StorageT* tdata = (StorageT*)resolve_relptr_cpp(tensor->data, base_ptr); return T(tdata, shape, tensor->total_elements); } else { // Primitives (int, double, float, etc.) // Record types are handled by generated overloads which are preferred // by overload resolution over this template. 
return *(T*)data; } } // ============================================================ // mpk_pack / mpk_unpack // ============================================================ template std::vector mpk_pack(const T& data, const std::string& schema_str) { const char* schema_ptr = schema_str.c_str(); Schema* schema = parse_schema_cpp(schema_ptr); void* voidstar = nullptr; char* msgpack_data = NULL; size_t msg_size = 0; try { voidstar = toAnything(schema, data); pack_with_schema_cpp(voidstar, schema, &msgpack_data, &msg_size); } catch (...) { if (voidstar) shfree_cpp(voidstar); free(msgpack_data); free_schema(schema); throw; } shfree_cpp(voidstar); std::vector result(msgpack_data, msgpack_data + msg_size); free(msgpack_data); free_schema(schema); return result; } template T mpk_unpack(const std::vector& packed_data, const std::string& schema_str) { const char* schema_ptr = schema_str.c_str(); Schema* schema = parse_schema_cpp(schema_ptr); void* voidstar = nullptr; int unpack_result = unpack_with_schema_cpp(packed_data.data(), packed_data.size(), schema, &voidstar); if (unpack_result != 0) { free_schema(schema); throw std::runtime_error("Unpacking failed"); } T x; try { x = fromAnything(schema, voidstar, static_cast(nullptr)); } catch (...) { free_schema(schema); shfree_cpp(voidstar); throw; } free_schema(schema); shfree_cpp(voidstar); return x; } #endif ================================================ FILE: data/lang/cpp/init.sh ================================================ #!/bin/bash set -e MORLOC_HOME="$1" BUILD_DIR="$2" SANITIZE_FLAGS="$3" INCLUDE_DIR="$MORLOC_HOME/include" LIB_DIR="$MORLOC_HOME/lib" # Install mlccpptypes if not present if [ ! 
-d "$INCLUDE_DIR/mlccpptypes" ]; then git clone https://github.com/morloclib/mlccpptypes "$INCLUDE_DIR/mlccpptypes" fi # Install headers cp "$BUILD_DIR/cppmorloc.hpp" "$INCLUDE_DIR/" cp "$BUILD_DIR/mlc_arrow.hpp" "$INCLUDE_DIR/" cp "$BUILD_DIR/mlc_tensor.hpp" "$INCLUDE_DIR/" # Install nanoarrow headers mkdir -p "$INCLUDE_DIR/nanoarrow" cp "$BUILD_DIR/nanoarrow.h" "$INCLUDE_DIR/nanoarrow/" # Compile nanoarrow.c gcc -c -O2 -fPIC $SANITIZE_FLAGS -I"$INCLUDE_DIR" -o "$BUILD_DIR/nanoarrow.o" "$BUILD_DIR/nanoarrow.c" # Compile cppmorloc.cpp g++ -c --std=c++17 -O2 $SANITIZE_FLAGS -I"$INCLUDE_DIR" -o "$BUILD_DIR/cppmorloc.o" "$BUILD_DIR/cppmorloc.cpp" # Archive into libcppmorloc.a ar rcs "$LIB_DIR/libcppmorloc.a" "$BUILD_DIR/cppmorloc.o" "$BUILD_DIR/nanoarrow.o" # Compile precompiled header cp "$BUILD_DIR/morloc_pch.hpp" "$INCLUDE_DIR/" g++ --std=c++17 -O2 $SANITIZE_FLAGS -I"$INCLUDE_DIR" -x c++-header "$INCLUDE_DIR/morloc_pch.hpp" -o "$INCLUDE_DIR/morloc_pch.hpp.gch" ================================================ FILE: data/lang/cpp/lang.yaml ================================================ # C++ language metadata for morloc compiler name: cpp extension: cpp aliases: ["c++"] is_compiled: true run_command: [] serial_type: "uint8_t*" cost: 0 ================================================ FILE: data/lang/cpp/mlc_arrow.hpp ================================================ #ifndef MLC_ARROW_HPP #define MLC_ARROW_HPP // mlc_arrow.hpp -- thin RAII wrapper around Arrow C Data Interface structs // for use in morloc C++ pools. Holds ArrowSchema + ArrowArray as a single // move-only value. The pool template dispatches arrow-hinted schemas to // arrow_to_shm / arrow_from_shm (in libmorloc.so) via this type. // // User code should include to build and read columns. #include "morloc.h" #include #include #include namespace mlc { class ArrowTable { public: // Construct from moved-in C Data Interface structs. // Takes ownership of release callbacks. 
ArrowTable(struct ArrowSchema schema, struct ArrowArray array) : schema_(schema), array_(array) { // Zero the source structs so the caller does not double-release memset(&schema, 0, sizeof(schema)); memset(&array, 0, sizeof(array)); } ~ArrowTable() { if (array_.release) array_.release(&array_); if (schema_.release) schema_.release(&schema_); } // Move-only ArrowTable(ArrowTable&& other) noexcept : schema_(other.schema_), array_(other.array_) { memset(&other.schema_, 0, sizeof(other.schema_)); memset(&other.array_, 0, sizeof(other.array_)); } ArrowTable& operator=(ArrowTable&& other) noexcept { if (this != &other) { if (array_.release) array_.release(&array_); if (schema_.release) schema_.release(&schema_); schema_ = other.schema_; array_ = other.array_; memset(&other.schema_, 0, sizeof(other.schema_)); memset(&other.array_, 0, sizeof(other.array_)); } return *this; } ArrowTable(const ArrowTable&) = delete; ArrowTable& operator=(const ArrowTable&) = delete; // Accessors (const -- arrow data is immutable) const struct ArrowSchema* schema() const { return &schema_; } const struct ArrowArray* array() const { return &array_; } int64_t n_columns() const { return schema_.n_children; } int64_t n_rows() const { return array_.length; } // Build from shared memory header (zero-copy import) static ArrowTable from_shm(const arrow_shm_header_t* hdr) { struct ArrowSchema as; struct ArrowArray aa; char* err = nullptr; arrow_from_shm(hdr, &as, &aa, &err); if (err) { std::string msg(err); free(err); throw std::runtime_error(msg); } return ArrowTable(std::move(as), std::move(aa)); } // Move table data to shared memory: copies buffers into a contiguous SHM // block, frees the original heap buffers, then repoints this table's // internal ArrowSchema/ArrowArray into the SHM block (zero-copy). // After this call the table is still usable but backed by SHM. // Returns relptr to the SHM block for use in packets. 
relptr_t move_to_shm() { // Step 1: copy all column data into contiguous SHM char* copy_err = nullptr; relptr_t rp = arrow_to_shm(&array_, &schema_, ©_err); if (copy_err) { std::string msg(copy_err); free(copy_err); throw std::runtime_error(msg); } // Step 2: release heap-backed structs (frees all original buffers) if (array_.release) array_.release(&array_); if (schema_.release) schema_.release(&schema_); memset(&schema_, 0, sizeof(schema_)); memset(&array_, 0, sizeof(array_)); // Step 3: resolve SHM pointer and rebuild structs pointing into it char* resolve_err = nullptr; void* abs = rel2abs(rp, &resolve_err); if (resolve_err) { std::string msg(resolve_err); free(resolve_err); throw std::runtime_error(msg); } char* shm_err = nullptr; arrow_from_shm((const arrow_shm_header_t*)abs, &schema_, &array_, &shm_err); if (shm_err) { std::string msg(shm_err); free(shm_err); throw std::runtime_error(msg); } return rp; } private: struct ArrowSchema schema_; struct ArrowArray array_; }; } // namespace mlc #endif // MLC_ARROW_HPP ================================================ FILE: data/lang/cpp/mlc_tensor.hpp ================================================ #ifndef MLC_TENSOR_HPP #define MLC_TENSOR_HPP // mlc_tensor.hpp -- dense N-dimensional tensor for morloc C++ pools. // Data is always contiguous row-major (C order). The Tensor struct in // schema.h defines the voidstar layout; this header provides the C++ // user-facing type that maps to it. #include "morloc.h" #include #include #include #include namespace mlc { // Storage type trait: maps bool to uint8_t so that tensor memory layout // matches the voidstar format (MORLOC_BOOL = 1 byte) regardless of // sizeof(bool) on the target platform. 
template struct tensor_storage { using type = T; }; template<> struct tensor_storage { using type = uint8_t; }; template using tensor_storage_t = typename tensor_storage::type; template class Tensor { using S = tensor_storage_t; public: // Construct with given shape, allocating data on the heap Tensor(const int64_t (&dims)[NDim]) : owns_data_(true) { for (int i = 0; i < NDim; i++) shape_[i] = dims[i]; total_ = 1; for (int i = 0; i < NDim; i++) total_ *= (size_t)shape_[i]; data_ = new S[total_](); } // Construct from initializer list of dims Tensor(std::initializer_list dims) : owns_data_(true) { if ((int)dims.size() != NDim) { throw std::runtime_error("Tensor dimension mismatch"); } int i = 0; for (auto d : dims) shape_[i++] = d; total_ = 1; for (i = 0; i < NDim; i++) total_ *= (size_t)shape_[i]; data_ = new S[total_](); } // Construct as a view over existing data (does not own) Tensor(S* data, const int64_t* shape, size_t total) : data_(data), total_(total), owns_data_(false) { for (int i = 0; i < NDim; i++) shape_[i] = shape[i]; } ~Tensor() { if (owns_data_ && data_) delete[] data_; } // Move-only Tensor(Tensor&& other) noexcept : data_(other.data_), total_(other.total_), owns_data_(other.owns_data_) { for (int i = 0; i < NDim; i++) shape_[i] = other.shape_[i]; other.data_ = nullptr; other.owns_data_ = false; } Tensor& operator=(Tensor&& other) noexcept { if (this != &other) { if (owns_data_ && data_) delete[] data_; data_ = other.data_; total_ = other.total_; owns_data_ = other.owns_data_; for (int i = 0; i < NDim; i++) shape_[i] = other.shape_[i]; other.data_ = nullptr; other.owns_data_ = false; } return *this; } Tensor(const Tensor&) = delete; Tensor& operator=(const Tensor&) = delete; // Accessors (S* for raw access; S == T for all types except bool) const S* data() const { return data_; } S* data() { return data_; } constexpr int ndim() const { return NDim; } const int64_t* shape() const { return shape_; } int64_t shape(int d) const { return shape_[d]; } 
size_t size() const { return total_; } // Linear access (returns S& which is uint8_t& for bool tensors; // implicit conversion to/from bool handles the difference) const S& operator[](size_t i) const { return data_[i]; } S& operator[](size_t i) { return data_[i]; } // 1D access template> const S& operator()(int64_t i) const { return data_[i]; } template> S& operator()(int64_t i) { return data_[i]; } // 2D access (row-major) template> const S& operator()(int64_t i, int64_t j) const { return data_[i * shape_[1] + j]; } template> S& operator()(int64_t i, int64_t j) { return data_[i * shape_[1] + j]; } // 3D access (row-major) template> const S& operator()(int64_t i, int64_t j, int64_t k) const { return data_[(i * shape_[1] + j) * shape_[2] + k]; } template> S& operator()(int64_t i, int64_t j, int64_t k) { return data_[(i * shape_[1] + j) * shape_[2] + k]; } private: S* data_ = nullptr; int64_t shape_[NDim] = {}; size_t total_ = 0; bool owns_data_ = false; }; // Convenience aliases template using Tensor1 = Tensor; template using Tensor2 = Tensor; template using Tensor3 = Tensor; template using Tensor4 = Tensor; template using Tensor5 = Tensor; // Type trait for detecting mlc::Tensor template struct is_mlc_tensor : std::false_type {}; template struct is_mlc_tensor> : std::true_type {}; template inline constexpr bool is_mlc_tensor_v = is_mlc_tensor::value; // Extract element type from Tensor template struct tensor_element; template struct tensor_element> { using type = T; }; template using tensor_element_t = typename tensor_element::type; // Extract ndim from Tensor template struct tensor_ndim; template struct tensor_ndim> { static constexpr int value = N; }; template inline constexpr int tensor_ndim_v = tensor_ndim::value; } // namespace mlc #endif // MLC_TENSOR_HPP ================================================ FILE: data/lang/cpp/morloc_pch.hpp ================================================ // Precompiled header for morloc C++ pools. 
// Compiled once during 'morloc init', reused for every pool compilation. #ifndef MORLOC_PCH_HPP #define MORLOC_PCH_HPP // STL containers #include #include #include #include #include #include #include // STL algorithms and utilities #include #include #include #include #include #include // Strings and I/O #include #include #include #include // C standard library #include #include #include #include #include #include // POSIX headers #include #include #include #include #include // Morloc runtime #include "morloc.h" #endif ================================================ FILE: data/lang/cpp/nanoarrow/nanoarrow.c ================================================ // Licensed to the Apache Software Foundation (ASF) under one // or more contributor license agreements. See the NOTICE file // distributed with this work for additional information // regarding copyright ownership. The ASF licenses this file // to you under the Apache License, Version 2.0 (the // "License"); you may not use this file except in compliance // with the License. You may obtain a copy of the License at // // http://www.apache.org/licenses/LICENSE-2.0 // // Unless required by applicable law or agreed to in writing, // software distributed under the License is distributed on an // "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY // KIND, either express or implied. See the License for the // specific language governing permissions and limitations // under the License. #include #include #include #include #include #include #include "nanoarrow/nanoarrow.h" const char* ArrowNanoarrowVersion(void) { return NANOARROW_VERSION; } int ArrowNanoarrowVersionInt(void) { return NANOARROW_VERSION_INT; } ArrowErrorCode ArrowErrorSet(struct ArrowError* error, const char* fmt, ...) 
{ if (error == NULL) { return NANOARROW_OK; } memset(error->message, 0, sizeof(error->message)); va_list args; va_start(args, fmt); int chars_needed = vsnprintf(error->message, sizeof(error->message), fmt, args); va_end(args); if (chars_needed < 0) { return EINVAL; } else if (((size_t)chars_needed) >= sizeof(error->message)) { return ERANGE; } else { return NANOARROW_OK; } } void ArrowLayoutInit(struct ArrowLayout* layout, enum ArrowType storage_type) { layout->buffer_type[0] = NANOARROW_BUFFER_TYPE_VALIDITY; layout->buffer_data_type[0] = NANOARROW_TYPE_BOOL; layout->buffer_type[1] = NANOARROW_BUFFER_TYPE_DATA; layout->buffer_data_type[1] = storage_type; layout->buffer_type[2] = NANOARROW_BUFFER_TYPE_NONE; layout->buffer_data_type[2] = NANOARROW_TYPE_UNINITIALIZED; layout->element_size_bits[0] = 1; layout->element_size_bits[1] = 0; layout->element_size_bits[2] = 0; layout->child_size_elements = 0; switch (storage_type) { case NANOARROW_TYPE_UNINITIALIZED: case NANOARROW_TYPE_NA: case NANOARROW_TYPE_RUN_END_ENCODED: layout->buffer_type[0] = NANOARROW_BUFFER_TYPE_NONE; layout->buffer_data_type[0] = NANOARROW_TYPE_UNINITIALIZED; layout->buffer_type[1] = NANOARROW_BUFFER_TYPE_NONE; layout->buffer_data_type[1] = NANOARROW_TYPE_UNINITIALIZED; layout->element_size_bits[0] = 0; break; case NANOARROW_TYPE_LIST: case NANOARROW_TYPE_MAP: layout->buffer_type[1] = NANOARROW_BUFFER_TYPE_DATA_OFFSET; layout->buffer_data_type[1] = NANOARROW_TYPE_INT32; layout->element_size_bits[1] = 32; break; case NANOARROW_TYPE_LARGE_LIST: layout->buffer_type[1] = NANOARROW_BUFFER_TYPE_DATA_OFFSET; layout->buffer_data_type[1] = NANOARROW_TYPE_INT64; layout->element_size_bits[1] = 64; break; case NANOARROW_TYPE_STRUCT: case NANOARROW_TYPE_FIXED_SIZE_LIST: layout->buffer_type[1] = NANOARROW_BUFFER_TYPE_NONE; layout->buffer_data_type[1] = NANOARROW_TYPE_UNINITIALIZED; break; case NANOARROW_TYPE_BOOL: layout->element_size_bits[1] = 1; break; case NANOARROW_TYPE_UINT8: case NANOARROW_TYPE_INT8: 
layout->element_size_bits[1] = 8; break; case NANOARROW_TYPE_UINT16: case NANOARROW_TYPE_INT16: case NANOARROW_TYPE_HALF_FLOAT: layout->element_size_bits[1] = 16; break; case NANOARROW_TYPE_UINT32: case NANOARROW_TYPE_INT32: case NANOARROW_TYPE_FLOAT: case NANOARROW_TYPE_DECIMAL32: layout->element_size_bits[1] = 32; break; case NANOARROW_TYPE_INTERVAL_MONTHS: layout->buffer_data_type[1] = NANOARROW_TYPE_INT32; layout->element_size_bits[1] = 32; break; case NANOARROW_TYPE_UINT64: case NANOARROW_TYPE_INT64: case NANOARROW_TYPE_DOUBLE: case NANOARROW_TYPE_INTERVAL_DAY_TIME: case NANOARROW_TYPE_DECIMAL64: layout->element_size_bits[1] = 64; break; case NANOARROW_TYPE_DECIMAL128: case NANOARROW_TYPE_INTERVAL_MONTH_DAY_NANO: layout->element_size_bits[1] = 128; break; case NANOARROW_TYPE_DECIMAL256: layout->element_size_bits[1] = 256; break; case NANOARROW_TYPE_FIXED_SIZE_BINARY: layout->buffer_data_type[1] = NANOARROW_TYPE_BINARY; break; case NANOARROW_TYPE_DENSE_UNION: layout->buffer_type[0] = NANOARROW_BUFFER_TYPE_TYPE_ID; layout->buffer_data_type[0] = NANOARROW_TYPE_INT8; layout->element_size_bits[0] = 8; layout->buffer_type[1] = NANOARROW_BUFFER_TYPE_UNION_OFFSET; layout->buffer_data_type[1] = NANOARROW_TYPE_INT32; layout->element_size_bits[1] = 32; break; case NANOARROW_TYPE_SPARSE_UNION: layout->buffer_type[0] = NANOARROW_BUFFER_TYPE_TYPE_ID; layout->buffer_data_type[0] = NANOARROW_TYPE_INT8; layout->element_size_bits[0] = 8; layout->buffer_type[1] = NANOARROW_BUFFER_TYPE_NONE; layout->buffer_data_type[1] = NANOARROW_TYPE_UNINITIALIZED; break; case NANOARROW_TYPE_STRING: case NANOARROW_TYPE_BINARY: layout->buffer_type[1] = NANOARROW_BUFFER_TYPE_DATA_OFFSET; layout->buffer_data_type[1] = NANOARROW_TYPE_INT32; layout->element_size_bits[1] = 32; layout->buffer_type[2] = NANOARROW_BUFFER_TYPE_DATA; layout->buffer_data_type[2] = storage_type; break; case NANOARROW_TYPE_LARGE_STRING: layout->buffer_type[1] = NANOARROW_BUFFER_TYPE_DATA_OFFSET; layout->buffer_data_type[1] = 
NANOARROW_TYPE_INT64; layout->element_size_bits[1] = 64; layout->buffer_type[2] = NANOARROW_BUFFER_TYPE_DATA; layout->buffer_data_type[2] = NANOARROW_TYPE_STRING; break; case NANOARROW_TYPE_LARGE_BINARY: layout->buffer_type[1] = NANOARROW_BUFFER_TYPE_DATA_OFFSET; layout->buffer_data_type[1] = NANOARROW_TYPE_INT64; layout->element_size_bits[1] = 64; layout->buffer_type[2] = NANOARROW_BUFFER_TYPE_DATA; layout->buffer_data_type[2] = NANOARROW_TYPE_BINARY; break; case NANOARROW_TYPE_BINARY_VIEW: layout->buffer_type[1] = NANOARROW_BUFFER_TYPE_DATA; layout->buffer_data_type[1] = NANOARROW_TYPE_BINARY_VIEW; layout->element_size_bits[1] = 128; break; case NANOARROW_TYPE_STRING_VIEW: layout->buffer_type[1] = NANOARROW_BUFFER_TYPE_DATA; layout->buffer_data_type[1] = NANOARROW_TYPE_STRING_VIEW; layout->element_size_bits[1] = 128; break; case NANOARROW_TYPE_LIST_VIEW: layout->buffer_type[1] = NANOARROW_BUFFER_TYPE_VIEW_OFFSET; layout->buffer_data_type[1] = NANOARROW_TYPE_INT32; layout->element_size_bits[1] = 32; layout->buffer_type[2] = NANOARROW_BUFFER_TYPE_SIZE; layout->buffer_data_type[2] = NANOARROW_TYPE_INT32; layout->element_size_bits[2] = 32; break; case NANOARROW_TYPE_LARGE_LIST_VIEW: layout->buffer_type[1] = NANOARROW_BUFFER_TYPE_VIEW_OFFSET; layout->buffer_data_type[1] = NANOARROW_TYPE_INT64; layout->element_size_bits[1] = 64; layout->buffer_type[2] = NANOARROW_BUFFER_TYPE_SIZE; layout->buffer_data_type[2] = NANOARROW_TYPE_INT64; layout->element_size_bits[2] = 64; break; default: break; } } void* ArrowMalloc(int64_t size) { return malloc(size); } void* ArrowRealloc(void* ptr, int64_t size) { return realloc(ptr, size); } void ArrowFree(void* ptr) { free(ptr); } static uint8_t* ArrowBufferAllocatorMallocReallocate( struct ArrowBufferAllocator* allocator, uint8_t* ptr, int64_t old_size, int64_t new_size) { NANOARROW_UNUSED(allocator); NANOARROW_UNUSED(old_size); return (uint8_t*)ArrowRealloc(ptr, new_size); } static void ArrowBufferAllocatorMallocFree(struct 
ArrowBufferAllocator* allocator, uint8_t* ptr, int64_t size) { NANOARROW_UNUSED(allocator); NANOARROW_UNUSED(size); if (ptr != NULL) { ArrowFree(ptr); } } static struct ArrowBufferAllocator ArrowBufferAllocatorMalloc = { &ArrowBufferAllocatorMallocReallocate, &ArrowBufferAllocatorMallocFree, NULL}; struct ArrowBufferAllocator ArrowBufferAllocatorDefault(void) { return ArrowBufferAllocatorMalloc; } static uint8_t* ArrowBufferDeallocatorReallocate(struct ArrowBufferAllocator* allocator, uint8_t* ptr, int64_t old_size, int64_t new_size) { NANOARROW_UNUSED(new_size); // Attempting to reallocate a buffer with a custom deallocator is // a programming error. In debug mode, crash here. #if defined(NANOARROW_DEBUG) NANOARROW_PRINT_AND_DIE(ENOMEM, "It is an error to reallocate a buffer whose allocator is " "ArrowBufferDeallocator()"); #endif // In release mode, ensure the the deallocator is called exactly // once using the pointer it was given and return NULL, which // will trigger the caller to return ENOMEM. 
allocator->free(allocator, ptr, old_size); *allocator = ArrowBufferAllocatorDefault(); return NULL; } struct ArrowBufferAllocator ArrowBufferDeallocator( void (*custom_free)(struct ArrowBufferAllocator* allocator, uint8_t* ptr, int64_t size), void* private_data) { struct ArrowBufferAllocator allocator; allocator.reallocate = &ArrowBufferDeallocatorReallocate; allocator.free = custom_free; allocator.private_data = private_data; return allocator; } static const int kInt32DecimalDigits = 9; static const uint64_t kUInt32PowersOfTen[] = { 1ULL, 10ULL, 100ULL, 1000ULL, 10000ULL, 100000ULL, 1000000ULL, 10000000ULL, 100000000ULL, 1000000000ULL}; // Adapted from Arrow C++ to use 32-bit words for better C portability // https://github.com/apache/arrow/blob/cd3321b28b0c9703e5d7105d6146c1270bbadd7f/cpp/src/arrow/util/decimal.cc#L524-L544 static void ShiftAndAdd(struct ArrowStringView value, uint32_t* out, int64_t out_size) { // We use strtoll for parsing, which needs input that is null-terminated char chunk_string[16]; for (int64_t posn = 0; posn < value.size_bytes;) { int64_t remaining = value.size_bytes - posn; int64_t group_size; if (remaining > kInt32DecimalDigits) { group_size = kInt32DecimalDigits; } else { group_size = remaining; } const uint64_t multiple = kUInt32PowersOfTen[group_size]; memcpy(chunk_string, value.data + posn, group_size); chunk_string[group_size] = '\0'; uint32_t chunk = (uint32_t)strtoll(chunk_string, NULL, 10); for (int64_t i = 0; i < out_size; i++) { uint64_t tmp = out[i]; tmp *= multiple; tmp += chunk; out[i] = (uint32_t)(tmp & 0xFFFFFFFFULL); chunk = (uint32_t)(tmp >> 32); } posn += group_size; } } ArrowErrorCode ArrowDecimalSetDigits(struct ArrowDecimal* decimal, struct ArrowStringView value) { // Check for sign int is_negative = value.data[0] == '-'; int has_sign = is_negative || value.data[0] == '+'; value.data += has_sign; value.size_bytes -= has_sign; // Check all characters are digits that are not the negative sign for (int64_t i = 0; i < 
value.size_bytes; i++) { char c = value.data[i]; if (c < '0' || c > '9') { return EINVAL; } } // Skip over leading 0s int64_t n_leading_zeroes = 0; for (int64_t i = 0; i < value.size_bytes; i++) { if (value.data[i] == '0') { n_leading_zeroes++; } else { break; } } value.data += n_leading_zeroes; value.size_bytes -= n_leading_zeroes; // Use 32-bit words for portability uint32_t words32[8]; memset(words32, 0, sizeof(words32)); int n_words32 = decimal->n_words > 0 ? decimal->n_words * 2 : 1; NANOARROW_DCHECK(n_words32 <= 8); memset(words32, 0, sizeof(words32)); ShiftAndAdd(value, words32, n_words32); if (_ArrowIsLittleEndian() || n_words32 == 1) { memcpy(decimal->words, words32, sizeof(uint32_t) * n_words32); } else { uint64_t lo; uint64_t hi; for (int i = 0; i < decimal->n_words; i++) { lo = (uint64_t)words32[i * 2]; hi = (uint64_t)words32[i * 2 + 1] << 32; decimal->words[decimal->n_words - i - 1] = lo | hi; } } if (is_negative) { ArrowDecimalNegate(decimal); } return NANOARROW_OK; } // Adapted from Arrow C++ for C // https://github.com/apache/arrow/blob/cd3321b28b0c9703e5d7105d6146c1270bbadd7f/cpp/src/arrow/util/decimal.cc#L365 ArrowErrorCode ArrowDecimalAppendDigitsToBuffer(const struct ArrowDecimal* decimal, struct ArrowBuffer* buffer) { NANOARROW_DCHECK(decimal->n_words == 0 || decimal->n_words == 1 || decimal->n_words == 2 || decimal->n_words == 4); // For the 32-bit case, just use snprintf() if (decimal->n_words == 0) { int32_t value; memcpy(&value, decimal->words, sizeof(int32_t)); NANOARROW_RETURN_NOT_OK(ArrowBufferReserve(buffer, 16)); int n_chars = snprintf((char*)buffer->data + buffer->size_bytes, (buffer->capacity_bytes - buffer->size_bytes), "%d", value); if (n_chars <= 0) { return EINVAL; } buffer->size_bytes += n_chars; return NANOARROW_OK; } int is_negative = ArrowDecimalSign(decimal) < 0; uint64_t words_little_endian[4]; if (decimal->n_words == 0) { words_little_endian[0] = 0; memcpy(words_little_endian, decimal->words, sizeof(uint32_t)); } else if 
(decimal->low_word_index == 0) { memcpy(words_little_endian, decimal->words, decimal->n_words * sizeof(uint64_t)); } else { for (int i = 0; i < decimal->n_words; i++) { words_little_endian[i] = decimal->words[decimal->n_words - i - 1]; } } // We've already made a copy, so negate that if needed if (is_negative) { if (decimal->n_words == 0) { uint32_t elem = (uint32_t)words_little_endian[0]; elem = ~elem + 1; words_little_endian[0] = (int32_t)elem; } else { uint64_t carry = 1; for (int i = 0; i < decimal->n_words; i++) { uint64_t elem = words_little_endian[i]; elem = ~elem + carry; carry &= (elem == 0); words_little_endian[i] = elem; } } } // Find the most significant word that is non-zero int most_significant_elem_idx = -1; if (decimal->n_words == 0) { if (words_little_endian[0] != 0) { most_significant_elem_idx = 0; } } else { for (int i = decimal->n_words - 1; i >= 0; i--) { if (words_little_endian[i] != 0) { most_significant_elem_idx = i; break; } } } // If they are all zero, the output is just '0' if (most_significant_elem_idx == -1) { NANOARROW_RETURN_NOT_OK(ArrowBufferAppendInt8(buffer, '0')); return NANOARROW_OK; } // Define segments such that each segment represents 9 digits with the // least significant group of 9 digits first. For example, if the input represents // 9876543210123456789, then segments will be [123456789, 876543210, 9]. // We handle at most a signed 256 bit integer, whose maximum value occupies 77 // characters. Thus, we need at most 9 segments. const uint32_t k1e9 = 1000000000U; int num_segments = 0; uint32_t segments[9]; memset(segments, 0, sizeof(segments)); uint64_t* most_significant_elem = words_little_endian + most_significant_elem_idx; do { // Compute remainder = words_little_endian % 1e9 and words_little_endian = // words_little_endian / 1e9. 
uint32_t remainder = 0; uint64_t* elem = most_significant_elem; do { // Compute dividend = (remainder << 32) | *elem (a virtual 96-bit integer); // *elem = dividend / 1e9; // remainder = dividend % 1e9. uint32_t hi = (uint32_t)(*elem >> 32); uint32_t lo = (uint32_t)(*elem & 0xFFFFFFFFULL); uint64_t dividend_hi = ((uint64_t)(remainder) << 32) | hi; uint64_t quotient_hi = dividend_hi / k1e9; remainder = (uint32_t)(dividend_hi % k1e9); uint64_t dividend_lo = ((uint64_t)(remainder) << 32) | lo; uint64_t quotient_lo = dividend_lo / k1e9; remainder = (uint32_t)(dividend_lo % k1e9); *elem = (quotient_hi << 32) | quotient_lo; } while (elem-- != words_little_endian); segments[num_segments++] = remainder; } while (*most_significant_elem != 0 || most_significant_elem-- != words_little_endian); // We know our output has no more than 9 digits per segment, plus a negative sign, // plus any further digits between our output of 9 digits plus enough // extra characters to ensure that snprintf() with n = 21 (maximum length of %lu // including a the null terminator) is bounded properly. NANOARROW_RETURN_NOT_OK(ArrowBufferReserve(buffer, num_segments * 9 + 1 + 21 - 9)); if (is_negative) { buffer->data[buffer->size_bytes++] = '-'; } // The most significant segment should have no leading zeroes int n_chars = snprintf((char*)buffer->data + buffer->size_bytes, 21, "%lu", (unsigned long)segments[num_segments - 1]); // Ensure that an encoding error from snprintf() does not result // in an out-of-bounds access. if (n_chars < 0) { return ERANGE; } buffer->size_bytes += n_chars; // Subsequent output needs to be left-padded with zeroes such that each segment // takes up exactly 9 digits. 
for (int i = num_segments - 2; i >= 0; i--) { int n_chars = snprintf((char*)buffer->data + buffer->size_bytes, 21, "%09lu", (unsigned long)segments[i]); buffer->size_bytes += n_chars; NANOARROW_DCHECK(buffer->size_bytes <= buffer->capacity_bytes); } return NANOARROW_OK; } ArrowErrorCode ArrowDecimalAppendStringToBuffer(const struct ArrowDecimal* decimal, struct ArrowBuffer* buffer) { int64_t buffer_size = buffer->size_bytes; NANOARROW_RETURN_NOT_OK(ArrowDecimalAppendDigitsToBuffer(decimal, buffer)); int64_t digits_size = buffer->size_bytes - buffer_size; if (decimal->scale <= 0) { // e.g., digits are -12345 and scale is -2 -> -1234500 // Just add zeros to the end for (int i = decimal->scale; i < 0; i++) { NANOARROW_RETURN_NOT_OK(ArrowBufferAppendInt8(buffer, '0')); } return NANOARROW_OK; } int is_negative = buffer->data[0] == '-'; int64_t num_digits = digits_size - is_negative; if (num_digits <= decimal->scale) { // e.g., digits are -12345 and scale is 6 -> -0.012345 // Insert "0." between the (maybe) negative sign and the digits int64_t num_zeros_after_decimal = decimal->scale - num_digits; NANOARROW_RETURN_NOT_OK( ArrowBufferResize(buffer, buffer->size_bytes + num_zeros_after_decimal + 2, 0)); uint8_t* digits_start = buffer->data + is_negative; memmove(digits_start + num_zeros_after_decimal + 2, digits_start, num_digits); *digits_start++ = '0'; *digits_start++ = '.'; for (int i = 0; i < num_zeros_after_decimal; i++) { *digits_start++ = '0'; } } else { // e.g., digits are -12345 and scale is 4 -> -1.2345 // Insert a decimal point before scale digits of output NANOARROW_RETURN_NOT_OK(ArrowBufferResize(buffer, buffer->size_bytes + 1, 0)); uint8_t* decimal_point_to_be = buffer->data + buffer->size_bytes - 1 - decimal->scale; memmove(decimal_point_to_be + 1, decimal_point_to_be, decimal->scale); *decimal_point_to_be = '.'; } return NANOARROW_OK; } // Licensed to the Apache Software Foundation (ASF) under one // or more contributor license agreements. 
See the NOTICE file // distributed with this work for additional information // regarding copyright ownership. The ASF licenses this file // to you under the Apache License, Version 2.0 (the // "License"); you may not use this file except in compliance // with the License. You may obtain a copy of the License at // // http://www.apache.org/licenses/LICENSE-2.0 // // Unless required by applicable law or agreed to in writing, // software distributed under the License is distributed on an // "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY // KIND, either express or implied. See the License for the // specific language governing permissions and limitations // under the License. #include #include #include #include #include #include "nanoarrow/nanoarrow.h" static void ArrowSchemaReleaseInternal(struct ArrowSchema* schema) { if (schema->format != NULL) ArrowFree((void*)schema->format); if (schema->name != NULL) ArrowFree((void*)schema->name); if (schema->metadata != NULL) ArrowFree((void*)schema->metadata); // This object owns the memory for all the children, but those // children may have been generated elsewhere and might have // their own release() callback. if (schema->children != NULL) { for (int64_t i = 0; i < schema->n_children; i++) { if (schema->children[i] != NULL) { if (schema->children[i]->release != NULL) { ArrowSchemaRelease(schema->children[i]); } ArrowFree(schema->children[i]); } } ArrowFree(schema->children); } // This object owns the memory for the dictionary but it // may have been generated somewhere else and have its own // release() callback. 
if (schema->dictionary != NULL) { if (schema->dictionary->release != NULL) { ArrowSchemaRelease(schema->dictionary); } ArrowFree(schema->dictionary); } // private data not currently used if (schema->private_data != NULL) { ArrowFree(schema->private_data); } schema->release = NULL; } static const char* ArrowSchemaFormatTemplate(enum ArrowType type) { switch (type) { case NANOARROW_TYPE_UNINITIALIZED: return NULL; case NANOARROW_TYPE_NA: return "n"; case NANOARROW_TYPE_BOOL: return "b"; case NANOARROW_TYPE_UINT8: return "C"; case NANOARROW_TYPE_INT8: return "c"; case NANOARROW_TYPE_UINT16: return "S"; case NANOARROW_TYPE_INT16: return "s"; case NANOARROW_TYPE_UINT32: return "I"; case NANOARROW_TYPE_INT32: return "i"; case NANOARROW_TYPE_UINT64: return "L"; case NANOARROW_TYPE_INT64: return "l"; case NANOARROW_TYPE_HALF_FLOAT: return "e"; case NANOARROW_TYPE_FLOAT: return "f"; case NANOARROW_TYPE_DOUBLE: return "g"; case NANOARROW_TYPE_STRING: return "u"; case NANOARROW_TYPE_LARGE_STRING: return "U"; case NANOARROW_TYPE_STRING_VIEW: return "vu"; case NANOARROW_TYPE_BINARY: return "z"; case NANOARROW_TYPE_BINARY_VIEW: return "vz"; case NANOARROW_TYPE_LARGE_BINARY: return "Z"; case NANOARROW_TYPE_DATE32: return "tdD"; case NANOARROW_TYPE_DATE64: return "tdm"; case NANOARROW_TYPE_INTERVAL_MONTHS: return "tiM"; case NANOARROW_TYPE_INTERVAL_DAY_TIME: return "tiD"; case NANOARROW_TYPE_INTERVAL_MONTH_DAY_NANO: return "tin"; case NANOARROW_TYPE_LIST: return "+l"; case NANOARROW_TYPE_LARGE_LIST: return "+L"; case NANOARROW_TYPE_LIST_VIEW: return "+vl"; case NANOARROW_TYPE_LARGE_LIST_VIEW: return "+vL"; case NANOARROW_TYPE_STRUCT: return "+s"; case NANOARROW_TYPE_MAP: return "+m"; case NANOARROW_TYPE_RUN_END_ENCODED: return "+r"; default: return NULL; } } static int ArrowSchemaInitChildrenIfNeeded(struct ArrowSchema* schema, enum ArrowType type) { switch (type) { case NANOARROW_TYPE_LIST: case NANOARROW_TYPE_LARGE_LIST: case NANOARROW_TYPE_FIXED_SIZE_LIST: case 
NANOARROW_TYPE_LIST_VIEW: case NANOARROW_TYPE_LARGE_LIST_VIEW: NANOARROW_RETURN_NOT_OK(ArrowSchemaAllocateChildren(schema, 1)); ArrowSchemaInit(schema->children[0]); NANOARROW_RETURN_NOT_OK(ArrowSchemaSetName(schema->children[0], "item")); break; case NANOARROW_TYPE_MAP: NANOARROW_RETURN_NOT_OK(ArrowSchemaAllocateChildren(schema, 1)); NANOARROW_RETURN_NOT_OK( ArrowSchemaInitFromType(schema->children[0], NANOARROW_TYPE_STRUCT)); NANOARROW_RETURN_NOT_OK(ArrowSchemaSetName(schema->children[0], "entries")); schema->children[0]->flags &= ~ARROW_FLAG_NULLABLE; NANOARROW_RETURN_NOT_OK(ArrowSchemaAllocateChildren(schema->children[0], 2)); ArrowSchemaInit(schema->children[0]->children[0]); ArrowSchemaInit(schema->children[0]->children[1]); NANOARROW_RETURN_NOT_OK( ArrowSchemaSetName(schema->children[0]->children[0], "key")); schema->children[0]->children[0]->flags &= ~ARROW_FLAG_NULLABLE; NANOARROW_RETURN_NOT_OK( ArrowSchemaSetName(schema->children[0]->children[1], "value")); break; case NANOARROW_TYPE_RUN_END_ENCODED: NANOARROW_RETURN_NOT_OK(ArrowSchemaAllocateChildren(schema, 2)); ArrowSchemaInit(schema->children[0]); NANOARROW_RETURN_NOT_OK(ArrowSchemaSetName(schema->children[0], "run_ends")); schema->children[0]->flags &= ~ARROW_FLAG_NULLABLE; ArrowSchemaInit(schema->children[1]); NANOARROW_RETURN_NOT_OK(ArrowSchemaSetName(schema->children[1], "values")); default: break; } return NANOARROW_OK; } void ArrowSchemaInit(struct ArrowSchema* schema) { schema->format = NULL; schema->name = NULL; schema->metadata = NULL; schema->flags = ARROW_FLAG_NULLABLE; schema->n_children = 0; schema->children = NULL; schema->dictionary = NULL; schema->private_data = NULL; schema->release = &ArrowSchemaReleaseInternal; } ArrowErrorCode ArrowSchemaSetType(struct ArrowSchema* schema, enum ArrowType type) { // We don't allocate the dictionary because it has to be nullptr // for non-dictionary-encoded arrays. 
// Set the format to a valid format string for type const char* template_format = ArrowSchemaFormatTemplate(type); // If type isn't recognized and not explicitly unset if (template_format == NULL && type != NANOARROW_TYPE_UNINITIALIZED) { return EINVAL; } NANOARROW_RETURN_NOT_OK(ArrowSchemaSetFormat(schema, template_format)); // For types with an umabiguous child structure, allocate children return ArrowSchemaInitChildrenIfNeeded(schema, type); } ArrowErrorCode ArrowSchemaSetTypeStruct(struct ArrowSchema* schema, int64_t n_children) { NANOARROW_RETURN_NOT_OK(ArrowSchemaSetType(schema, NANOARROW_TYPE_STRUCT)); NANOARROW_RETURN_NOT_OK(ArrowSchemaAllocateChildren(schema, n_children)); for (int64_t i = 0; i < n_children; i++) { ArrowSchemaInit(schema->children[i]); } return NANOARROW_OK; } ArrowErrorCode ArrowSchemaInitFromType(struct ArrowSchema* schema, enum ArrowType type) { ArrowSchemaInit(schema); int result = ArrowSchemaSetType(schema, type); if (result != NANOARROW_OK) { ArrowSchemaRelease(schema); return result; } return NANOARROW_OK; } ArrowErrorCode ArrowSchemaSetTypeFixedSize(struct ArrowSchema* schema, enum ArrowType type, int32_t fixed_size) { if (fixed_size <= 0) { return EINVAL; } char buffer[64]; int n_chars; switch (type) { case NANOARROW_TYPE_FIXED_SIZE_BINARY: n_chars = snprintf(buffer, sizeof(buffer), "w:%" PRId32, fixed_size); break; case NANOARROW_TYPE_FIXED_SIZE_LIST: n_chars = snprintf(buffer, sizeof(buffer), "+w:%" PRId32, fixed_size); break; default: return EINVAL; } if (((size_t)n_chars) >= sizeof(buffer) || n_chars < 0) { return ERANGE; } buffer[n_chars] = '\0'; NANOARROW_RETURN_NOT_OK(ArrowSchemaSetFormat(schema, buffer)); if (type == NANOARROW_TYPE_FIXED_SIZE_LIST) { NANOARROW_RETURN_NOT_OK(ArrowSchemaInitChildrenIfNeeded(schema, type)); } return NANOARROW_OK; } ArrowErrorCode ArrowSchemaSetTypeDecimal(struct ArrowSchema* schema, enum ArrowType type, int32_t decimal_precision, int32_t decimal_scale) { if (decimal_precision <= 0) { return 
EINVAL; } char buffer[64]; int n_chars; switch (type) { case NANOARROW_TYPE_DECIMAL32: if (decimal_precision > 9) { return EINVAL; } n_chars = snprintf(buffer, sizeof(buffer), "d:%d,%d,32", decimal_precision, decimal_scale); break; case NANOARROW_TYPE_DECIMAL64: if (decimal_precision > 18) { return EINVAL; } n_chars = snprintf(buffer, sizeof(buffer), "d:%d,%d,64", decimal_precision, decimal_scale); break; case NANOARROW_TYPE_DECIMAL128: if (decimal_precision > 38) { return EINVAL; } n_chars = snprintf(buffer, sizeof(buffer), "d:%d,%d", decimal_precision, decimal_scale); break; case NANOARROW_TYPE_DECIMAL256: if (decimal_precision > 76) { return EINVAL; } n_chars = snprintf(buffer, sizeof(buffer), "d:%d,%d,256", decimal_precision, decimal_scale); break; default: return EINVAL; } if (((size_t)n_chars) >= sizeof(buffer) || n_chars < 0) { return ERANGE; } buffer[n_chars] = '\0'; return ArrowSchemaSetFormat(schema, buffer); } ArrowErrorCode ArrowSchemaSetTypeRunEndEncoded(struct ArrowSchema* schema, enum ArrowType run_end_type) { switch (run_end_type) { case NANOARROW_TYPE_INT16: case NANOARROW_TYPE_INT32: case NANOARROW_TYPE_INT64: break; default: return EINVAL; } NANOARROW_RETURN_NOT_OK(ArrowSchemaSetFormat( schema, ArrowSchemaFormatTemplate(NANOARROW_TYPE_RUN_END_ENCODED))); NANOARROW_RETURN_NOT_OK( ArrowSchemaInitChildrenIfNeeded(schema, NANOARROW_TYPE_RUN_END_ENCODED)); NANOARROW_RETURN_NOT_OK(ArrowSchemaSetType(schema->children[0], run_end_type)); NANOARROW_RETURN_NOT_OK( ArrowSchemaSetType(schema->children[1], NANOARROW_TYPE_UNINITIALIZED)); return NANOARROW_OK; } static const char* ArrowTimeUnitFormatString(enum ArrowTimeUnit time_unit) { switch (time_unit) { case NANOARROW_TIME_UNIT_SECOND: return "s"; case NANOARROW_TIME_UNIT_MILLI: return "m"; case NANOARROW_TIME_UNIT_MICRO: return "u"; case NANOARROW_TIME_UNIT_NANO: return "n"; default: return NULL; } } ArrowErrorCode ArrowSchemaSetTypeDateTime(struct ArrowSchema* schema, enum ArrowType type, enum 
ArrowTimeUnit time_unit, const char* timezone) { const char* time_unit_str = ArrowTimeUnitFormatString(time_unit); if (time_unit_str == NULL) { return EINVAL; } char buffer[128]; int n_chars; switch (type) { case NANOARROW_TYPE_TIME32: if (timezone != NULL) { return EINVAL; } switch (time_unit) { case NANOARROW_TIME_UNIT_MICRO: case NANOARROW_TIME_UNIT_NANO: return EINVAL; default: break; } n_chars = snprintf(buffer, sizeof(buffer), "tt%s", time_unit_str); break; case NANOARROW_TYPE_TIME64: if (timezone != NULL) { return EINVAL; } switch (time_unit) { case NANOARROW_TIME_UNIT_SECOND: case NANOARROW_TIME_UNIT_MILLI: return EINVAL; default: break; } n_chars = snprintf(buffer, sizeof(buffer), "tt%s", time_unit_str); break; case NANOARROW_TYPE_TIMESTAMP: if (timezone == NULL) { timezone = ""; } n_chars = snprintf(buffer, sizeof(buffer), "ts%s:%s", time_unit_str, timezone); break; case NANOARROW_TYPE_DURATION: if (timezone != NULL) { return EINVAL; } n_chars = snprintf(buffer, sizeof(buffer), "tD%s", time_unit_str); break; default: return EINVAL; } if (((size_t)n_chars) >= sizeof(buffer) || n_chars < 0) { return ERANGE; } buffer[n_chars] = '\0'; return ArrowSchemaSetFormat(schema, buffer); } ArrowErrorCode ArrowSchemaSetTypeUnion(struct ArrowSchema* schema, enum ArrowType type, int64_t n_children) { if (n_children < 0 || n_children > 127) { return EINVAL; } // Max valid size would be +ud:0,1,...126 = 401 characters + null terminator char format_out[512]; int64_t format_out_size = 512; memset(format_out, 0, format_out_size); int n_chars; char* format_cursor = format_out; switch (type) { case NANOARROW_TYPE_SPARSE_UNION: n_chars = snprintf(format_cursor, format_out_size, "+us:"); format_cursor += n_chars; format_out_size -= n_chars; break; case NANOARROW_TYPE_DENSE_UNION: n_chars = snprintf(format_cursor, format_out_size, "+ud:"); format_cursor += n_chars; format_out_size -= n_chars; break; default: return EINVAL; } // Ensure that an encoding error from snprintf() does 
not result // in an out-of-bounds access. if (n_chars < 0) { return ERANGE; } if (n_children > 0) { n_chars = snprintf(format_cursor, format_out_size, "0"); format_cursor += n_chars; format_out_size -= n_chars; for (int64_t i = 1; i < n_children; i++) { n_chars = snprintf(format_cursor, format_out_size, ",%" PRId64, i); format_cursor += n_chars; format_out_size -= n_chars; } } // Ensure that an encoding error from snprintf() does not result // in an out-of-bounds access. if (n_chars < 0) { return ERANGE; } NANOARROW_RETURN_NOT_OK(ArrowSchemaSetFormat(schema, format_out)); NANOARROW_RETURN_NOT_OK(ArrowSchemaAllocateChildren(schema, n_children)); for (int64_t i = 0; i < n_children; i++) { ArrowSchemaInit(schema->children[i]); } return NANOARROW_OK; } ArrowErrorCode ArrowSchemaSetFormat(struct ArrowSchema* schema, const char* format) { if (schema->format != NULL) { ArrowFree((void*)schema->format); } if (format != NULL) { size_t format_size = strlen(format) + 1; schema->format = (const char*)ArrowMalloc(format_size); if (schema->format == NULL) { return ENOMEM; } memcpy((void*)schema->format, format, format_size); } else { schema->format = NULL; } return NANOARROW_OK; } ArrowErrorCode ArrowSchemaSetName(struct ArrowSchema* schema, const char* name) { if (schema->name != NULL) { ArrowFree((void*)schema->name); } if (name != NULL) { size_t name_size = strlen(name) + 1; schema->name = (const char*)ArrowMalloc(name_size); if (schema->name == NULL) { return ENOMEM; } memcpy((void*)schema->name, name, name_size); } else { schema->name = NULL; } return NANOARROW_OK; } ArrowErrorCode ArrowSchemaSetMetadata(struct ArrowSchema* schema, const char* metadata) { if (schema->metadata != NULL) { ArrowFree((void*)schema->metadata); } if (metadata != NULL) { size_t metadata_size = ArrowMetadataSizeOf(metadata); schema->metadata = (const char*)ArrowMalloc(metadata_size); if (schema->metadata == NULL) { return ENOMEM; } memcpy((void*)schema->metadata, metadata, metadata_size); } else { 
schema->metadata = NULL; } return NANOARROW_OK; } ArrowErrorCode ArrowSchemaAllocateChildren(struct ArrowSchema* schema, int64_t n_children) { if (schema->children != NULL) { return EEXIST; } if (n_children > 0) { schema->children = (struct ArrowSchema**)ArrowMalloc(n_children * sizeof(struct ArrowSchema*)); if (schema->children == NULL) { return ENOMEM; } schema->n_children = n_children; memset(schema->children, 0, n_children * sizeof(struct ArrowSchema*)); for (int64_t i = 0; i < n_children; i++) { schema->children[i] = (struct ArrowSchema*)ArrowMalloc(sizeof(struct ArrowSchema)); if (schema->children[i] == NULL) { return ENOMEM; } schema->children[i]->release = NULL; } } return NANOARROW_OK; } ArrowErrorCode ArrowSchemaAllocateDictionary(struct ArrowSchema* schema) { if (schema->dictionary != NULL) { return EEXIST; } schema->dictionary = (struct ArrowSchema*)ArrowMalloc(sizeof(struct ArrowSchema)); if (schema->dictionary == NULL) { return ENOMEM; } schema->dictionary->release = NULL; return NANOARROW_OK; } ArrowErrorCode ArrowSchemaDeepCopy(const struct ArrowSchema* schema, struct ArrowSchema* schema_out) { ArrowSchemaInit(schema_out); int result = ArrowSchemaSetFormat(schema_out, schema->format); if (result != NANOARROW_OK) { ArrowSchemaRelease(schema_out); return result; } schema_out->flags = schema->flags; result = ArrowSchemaSetName(schema_out, schema->name); if (result != NANOARROW_OK) { ArrowSchemaRelease(schema_out); return result; } result = ArrowSchemaSetMetadata(schema_out, schema->metadata); if (result != NANOARROW_OK) { ArrowSchemaRelease(schema_out); return result; } result = ArrowSchemaAllocateChildren(schema_out, schema->n_children); if (result != NANOARROW_OK) { ArrowSchemaRelease(schema_out); return result; } for (int64_t i = 0; i < schema->n_children; i++) { result = ArrowSchemaDeepCopy(schema->children[i], schema_out->children[i]); if (result != NANOARROW_OK) { ArrowSchemaRelease(schema_out); return result; } } if (schema->dictionary != NULL) 
  /* Continuation of ArrowSchemaDeepCopy: copy the dictionary, if present. */
  {
    result = ArrowSchemaAllocateDictionary(schema_out);
    if (result != NANOARROW_OK) {
      ArrowSchemaRelease(schema_out);
      return result;
    }

    result = ArrowSchemaDeepCopy(schema->dictionary, schema_out->dictionary);
    if (result != NANOARROW_OK) {
      ArrowSchemaRelease(schema_out);
      return result;
    }
  }

  return NANOARROW_OK;
}

/* Set both the logical type and the storage type of the view to the same
 * primitive type. */
static void ArrowSchemaViewSetPrimitive(struct ArrowSchemaView* schema_view,
                                        enum ArrowType type) {
  schema_view->type = type;
  schema_view->storage_type = type;
}

/* Parse an Arrow C data interface format string into schema_view, writing a
 * pointer one past the last consumed character to *format_end_out. Returns
 * EINVAL (with error populated) on malformed input. */
static ArrowErrorCode ArrowSchemaViewParse(struct ArrowSchemaView* schema_view,
                                           const char* format,
                                           const char** format_end_out,
                                           struct ArrowError* error) {
  *format_end_out = format;

  // needed for decimal parsing
  const char* parse_start;
  char* parse_end;

  switch (format[0]) {
    case 'n':
      schema_view->type = NANOARROW_TYPE_NA;
      schema_view->storage_type = NANOARROW_TYPE_NA;
      *format_end_out = format + 1;
      return NANOARROW_OK;
    case 'b':
      ArrowSchemaViewSetPrimitive(schema_view, NANOARROW_TYPE_BOOL);
      *format_end_out = format + 1;
      return NANOARROW_OK;
    case 'c':
      ArrowSchemaViewSetPrimitive(schema_view, NANOARROW_TYPE_INT8);
      *format_end_out = format + 1;
      return NANOARROW_OK;
    case 'C':
      ArrowSchemaViewSetPrimitive(schema_view, NANOARROW_TYPE_UINT8);
      *format_end_out = format + 1;
      return NANOARROW_OK;
    case 's':
      ArrowSchemaViewSetPrimitive(schema_view, NANOARROW_TYPE_INT16);
      *format_end_out = format + 1;
      return NANOARROW_OK;
    case 'S':
      ArrowSchemaViewSetPrimitive(schema_view, NANOARROW_TYPE_UINT16);
      *format_end_out = format + 1;
      return NANOARROW_OK;
    case 'i':
      ArrowSchemaViewSetPrimitive(schema_view, NANOARROW_TYPE_INT32);
      *format_end_out = format + 1;
      return NANOARROW_OK;
    case 'I':
      ArrowSchemaViewSetPrimitive(schema_view, NANOARROW_TYPE_UINT32);
      *format_end_out = format + 1;
      return NANOARROW_OK;
    case 'l':
      ArrowSchemaViewSetPrimitive(schema_view, NANOARROW_TYPE_INT64);
      *format_end_out = format + 1;
      return NANOARROW_OK;
    case 'L':
      ArrowSchemaViewSetPrimitive(schema_view, NANOARROW_TYPE_UINT64);
      *format_end_out = format +
1; return NANOARROW_OK; case 'e': ArrowSchemaViewSetPrimitive(schema_view, NANOARROW_TYPE_HALF_FLOAT); *format_end_out = format + 1; return NANOARROW_OK; case 'f': ArrowSchemaViewSetPrimitive(schema_view, NANOARROW_TYPE_FLOAT); *format_end_out = format + 1; return NANOARROW_OK; case 'g': ArrowSchemaViewSetPrimitive(schema_view, NANOARROW_TYPE_DOUBLE); *format_end_out = format + 1; return NANOARROW_OK; // decimal case 'd': if (format[1] != ':' || format[2] == '\0') { ArrowErrorSet(error, "Expected ':precision,scale[,bitwidth]' following 'd'"); return EINVAL; } parse_start = format + 2; schema_view->decimal_precision = (int32_t)strtol(parse_start, &parse_end, 10); if (parse_end == parse_start || parse_end[0] != ',') { ArrowErrorSet(error, "Expected 'precision,scale[,bitwidth]' following 'd:'"); return EINVAL; } parse_start = parse_end + 1; schema_view->decimal_scale = (int32_t)strtol(parse_start, &parse_end, 10); if (parse_end == parse_start) { ArrowErrorSet(error, "Expected 'scale[,bitwidth]' following 'd:precision,'"); return EINVAL; } else if (parse_end[0] != ',') { schema_view->decimal_bitwidth = 128; } else { parse_start = parse_end + 1; schema_view->decimal_bitwidth = (int32_t)strtol(parse_start, &parse_end, 10); if (parse_start == parse_end) { ArrowErrorSet(error, "Expected precision following 'd:precision,scale,'"); return EINVAL; } } *format_end_out = parse_end; switch (schema_view->decimal_bitwidth) { case 32: ArrowSchemaViewSetPrimitive(schema_view, NANOARROW_TYPE_DECIMAL32); return NANOARROW_OK; case 64: ArrowSchemaViewSetPrimitive(schema_view, NANOARROW_TYPE_DECIMAL64); return NANOARROW_OK; case 128: ArrowSchemaViewSetPrimitive(schema_view, NANOARROW_TYPE_DECIMAL128); return NANOARROW_OK; case 256: ArrowSchemaViewSetPrimitive(schema_view, NANOARROW_TYPE_DECIMAL256); return NANOARROW_OK; default: ArrowErrorSet(error, "Expected decimal bitwidth of 128 or 256 but found %" PRId32, schema_view->decimal_bitwidth); return EINVAL; } // validity + data case 'w': 
      /* Fixed-size binary: "w:size". */
      schema_view->type = NANOARROW_TYPE_FIXED_SIZE_BINARY;
      schema_view->storage_type = NANOARROW_TYPE_FIXED_SIZE_BINARY;
      if (format[1] != ':' || format[2] == '\0') {
        ArrowErrorSet(error, "Expected ':' following 'w'");
        return EINVAL;
      }

      schema_view->fixed_size = (int32_t)strtol(format + 2, (char**)format_end_out, 10);
      return NANOARROW_OK;

    // validity + offset + data
    case 'z':
      schema_view->type = NANOARROW_TYPE_BINARY;
      schema_view->storage_type = NANOARROW_TYPE_BINARY;
      *format_end_out = format + 1;
      return NANOARROW_OK;
    case 'u':
      schema_view->type = NANOARROW_TYPE_STRING;
      schema_view->storage_type = NANOARROW_TYPE_STRING;
      *format_end_out = format + 1;
      return NANOARROW_OK;

    // validity + large_offset + data
    case 'Z':
      schema_view->type = NANOARROW_TYPE_LARGE_BINARY;
      schema_view->storage_type = NANOARROW_TYPE_LARGE_BINARY;
      *format_end_out = format + 1;
      return NANOARROW_OK;
    case 'U':
      schema_view->type = NANOARROW_TYPE_LARGE_STRING;
      schema_view->storage_type = NANOARROW_TYPE_LARGE_STRING;
      *format_end_out = format + 1;
      return NANOARROW_OK;

    // nested types
    case '+':
      switch (format[1]) {
        // list has validity + offset or offset
        case 'l':
          schema_view->storage_type = NANOARROW_TYPE_LIST;
          schema_view->type = NANOARROW_TYPE_LIST;
          *format_end_out = format + 2;
          return NANOARROW_OK;
        // large list has validity + large_offset or large_offset
        case 'L':
          schema_view->storage_type = NANOARROW_TYPE_LARGE_LIST;
          schema_view->type = NANOARROW_TYPE_LARGE_LIST;
          *format_end_out = format + 2;
          return NANOARROW_OK;
        // run end encoded has no buffer at all
        case 'r':
          schema_view->storage_type = NANOARROW_TYPE_RUN_END_ENCODED;
          schema_view->type = NANOARROW_TYPE_RUN_END_ENCODED;
          *format_end_out = format + 2;
          return NANOARROW_OK;
        // just validity buffer
        case 'w':
          /* Fixed-size list: "+w:size". */
          if (format[2] != ':' || format[3] == '\0') {
            ArrowErrorSet(error, "Expected ':' following '+w'");
            return EINVAL;
          }

          schema_view->storage_type = NANOARROW_TYPE_FIXED_SIZE_LIST;
          schema_view->type = NANOARROW_TYPE_FIXED_SIZE_LIST;
          schema_view->fixed_size =
              (int32_t)strtol(format + 3, (char**)format_end_out, 10);
          return NANOARROW_OK;
        case 's':
          schema_view->storage_type = NANOARROW_TYPE_STRUCT;
          schema_view->type = NANOARROW_TYPE_STRUCT;
          *format_end_out = format + 2;
          return NANOARROW_OK;
        case 'm':
          schema_view->storage_type = NANOARROW_TYPE_MAP;
          schema_view->type = NANOARROW_TYPE_MAP;
          *format_end_out = format + 2;
          return NANOARROW_OK;
        // unions: "+ud:ids" (dense) or "+us:ids" (sparse)
        case 'u':
          switch (format[2]) {
            case 'd':
              schema_view->storage_type = NANOARROW_TYPE_DENSE_UNION;
              schema_view->type = NANOARROW_TYPE_DENSE_UNION;
              break;
            case 's':
              schema_view->storage_type = NANOARROW_TYPE_SPARSE_UNION;
              schema_view->type = NANOARROW_TYPE_SPARSE_UNION;
              break;
            default:
              ArrowErrorSet(error,
                            "Expected union format string +us: or "
                            "+ud: but found '%s'",
                            format);
              return EINVAL;
          }

          if (format[3] == ':') {
            schema_view->union_type_ids = format + 4;
            /* The number of declared type ids must match the child count. */
            int64_t n_type_ids =
                _ArrowParseUnionTypeIds(schema_view->union_type_ids, NULL);
            if (n_type_ids != schema_view->schema->n_children) {
              ArrowErrorSet(error,
                            "Expected union type_ids parameter to be a comma-separated "
                            "list of %" PRId64 " values between 0 and 127 but found '%s'",
                            schema_view->schema->n_children,
                            schema_view->union_type_ids);
              return EINVAL;
            }
            *format_end_out = format + strlen(format);
            return NANOARROW_OK;
          } else {
            ArrowErrorSet(error,
                          "Expected union format string +us: or +ud: "
                          "but found '%s'",
                          format);
            return EINVAL;
          }

        // views
        case 'v':
          switch (format[2]) {
            case 'l':
              schema_view->storage_type = NANOARROW_TYPE_LIST_VIEW;
              schema_view->type = NANOARROW_TYPE_LIST_VIEW;
              *format_end_out = format + 3;
              return NANOARROW_OK;
            case 'L':
              schema_view->storage_type = NANOARROW_TYPE_LARGE_LIST_VIEW;
              schema_view->type = NANOARROW_TYPE_LARGE_LIST_VIEW;
              *format_end_out = format + 3;
              return NANOARROW_OK;
            default:
              ArrowErrorSet(
                  error, "Expected view format string +vl or +vL but found '%s'", format);
              return EINVAL;
          }

        default:
          ArrowErrorSet(error, "Expected nested type format string but found '%s'", format);
          return EINVAL;
      }
    // date/time types: "t" followed by a subtype and unit character
    case 't':
      switch (format[1]) {
        // date
        case 'd':
          switch (format[2]) {
            case 'D':
              /* date32: days stored as int32. */
              ArrowSchemaViewSetPrimitive(schema_view, NANOARROW_TYPE_INT32);
              schema_view->type = NANOARROW_TYPE_DATE32;
              *format_end_out = format + 3;
              return NANOARROW_OK;
            case 'm':
              /* date64: milliseconds stored as int64. */
              ArrowSchemaViewSetPrimitive(schema_view, NANOARROW_TYPE_INT64);
              schema_view->type = NANOARROW_TYPE_DATE64;
              *format_end_out = format + 3;
              return NANOARROW_OK;
            default:
              ArrowErrorSet(error, "Expected 'D' or 'm' following 'td' but found '%s'",
                            format + 2);
              return EINVAL;
          }

        // time of day
        case 't':
          switch (format[2]) {
            case 's':
              ArrowSchemaViewSetPrimitive(schema_view, NANOARROW_TYPE_INT32);
              schema_view->type = NANOARROW_TYPE_TIME32;
              schema_view->time_unit = NANOARROW_TIME_UNIT_SECOND;
              *format_end_out = format + 3;
              return NANOARROW_OK;
            case 'm':
              ArrowSchemaViewSetPrimitive(schema_view, NANOARROW_TYPE_INT32);
              schema_view->type = NANOARROW_TYPE_TIME32;
              schema_view->time_unit = NANOARROW_TIME_UNIT_MILLI;
              *format_end_out = format + 3;
              return NANOARROW_OK;
            case 'u':
              /* Micro/nano resolutions need 64-bit storage. */
              ArrowSchemaViewSetPrimitive(schema_view, NANOARROW_TYPE_INT64);
              schema_view->type = NANOARROW_TYPE_TIME64;
              schema_view->time_unit = NANOARROW_TIME_UNIT_MICRO;
              *format_end_out = format + 3;
              return NANOARROW_OK;
            case 'n':
              ArrowSchemaViewSetPrimitive(schema_view, NANOARROW_TYPE_INT64);
              schema_view->type = NANOARROW_TYPE_TIME64;
              schema_view->time_unit = NANOARROW_TIME_UNIT_NANO;
              *format_end_out = format + 3;
              return NANOARROW_OK;
            default:
              ArrowErrorSet(
                  error, "Expected 's', 'm', 'u', or 'n' following 'tt' but found '%s'",
                  format + 2);
              return EINVAL;
          }

        // timestamp
        case 's':
          switch (format[2]) {
            case 's':
              ArrowSchemaViewSetPrimitive(schema_view, NANOARROW_TYPE_INT64);
              schema_view->type = NANOARROW_TYPE_TIMESTAMP;
              schema_view->time_unit = NANOARROW_TIME_UNIT_SECOND;
              break;
            case 'm':
              ArrowSchemaViewSetPrimitive(schema_view, NANOARROW_TYPE_INT64);
              schema_view->type = NANOARROW_TYPE_TIMESTAMP;
              schema_view->time_unit = NANOARROW_TIME_UNIT_MILLI;
              break;
            case 'u':
ArrowSchemaViewSetPrimitive(schema_view, NANOARROW_TYPE_INT64); schema_view->type = NANOARROW_TYPE_TIMESTAMP; schema_view->time_unit = NANOARROW_TIME_UNIT_MICRO; break; case 'n': ArrowSchemaViewSetPrimitive(schema_view, NANOARROW_TYPE_INT64); schema_view->type = NANOARROW_TYPE_TIMESTAMP; schema_view->time_unit = NANOARROW_TIME_UNIT_NANO; break; default: ArrowErrorSet( error, "Expected 's', 'm', 'u', or 'n' following 'ts' but found '%s'", format + 2); return EINVAL; } if (format[3] != ':') { ArrowErrorSet(error, "Expected ':' following '%.3s' but found '%s'", format, format + 3); return EINVAL; } schema_view->timezone = format + 4; *format_end_out = format + strlen(format); return NANOARROW_OK; // duration case 'D': switch (format[2]) { case 's': ArrowSchemaViewSetPrimitive(schema_view, NANOARROW_TYPE_INT64); schema_view->type = NANOARROW_TYPE_DURATION; schema_view->time_unit = NANOARROW_TIME_UNIT_SECOND; *format_end_out = format + 3; return NANOARROW_OK; case 'm': ArrowSchemaViewSetPrimitive(schema_view, NANOARROW_TYPE_INT64); schema_view->type = NANOARROW_TYPE_DURATION; schema_view->time_unit = NANOARROW_TIME_UNIT_MILLI; *format_end_out = format + 3; return NANOARROW_OK; case 'u': ArrowSchemaViewSetPrimitive(schema_view, NANOARROW_TYPE_INT64); schema_view->type = NANOARROW_TYPE_DURATION; schema_view->time_unit = NANOARROW_TIME_UNIT_MICRO; *format_end_out = format + 3; return NANOARROW_OK; case 'n': ArrowSchemaViewSetPrimitive(schema_view, NANOARROW_TYPE_INT64); schema_view->type = NANOARROW_TYPE_DURATION; schema_view->time_unit = NANOARROW_TIME_UNIT_NANO; *format_end_out = format + 3; return NANOARROW_OK; default: ArrowErrorSet(error, "Expected 's', 'm', u', or 'n' following 'tD' but found '%s'", format + 2); return EINVAL; } // interval case 'i': switch (format[2]) { case 'M': ArrowSchemaViewSetPrimitive(schema_view, NANOARROW_TYPE_INTERVAL_MONTHS); *format_end_out = format + 3; return NANOARROW_OK; case 'D': ArrowSchemaViewSetPrimitive(schema_view, 
                                          NANOARROW_TYPE_INTERVAL_DAY_TIME);
              *format_end_out = format + 3;
              return NANOARROW_OK;
            case 'n':
              ArrowSchemaViewSetPrimitive(schema_view,
                                          NANOARROW_TYPE_INTERVAL_MONTH_DAY_NANO);
              *format_end_out = format + 3;
              return NANOARROW_OK;
            default:
              ArrowErrorSet(error,
                            "Expected 'M', 'D', or 'n' following 'ti' but found '%s'",
                            format + 2);
              return EINVAL;
          }

        default:
          ArrowErrorSet(
              error, "Expected 'd', 't', 's', 'D', or 'i' following 't' but found '%s'",
              format + 1);
          return EINVAL;
      }

    // view types
    case 'v': {
      switch (format[1]) {
        case 'u':
          ArrowSchemaViewSetPrimitive(schema_view, NANOARROW_TYPE_STRING_VIEW);
          *format_end_out = format + 2;
          return NANOARROW_OK;
        case 'z':
          ArrowSchemaViewSetPrimitive(schema_view, NANOARROW_TYPE_BINARY_VIEW);
          *format_end_out = format + 2;
          return NANOARROW_OK;
        default:
          ArrowErrorSet(error, "Expected 'u', or 'z' following 'v' but found '%s'",
                        format + 1);
          return EINVAL;
      }
    }

    default:
      ArrowErrorSet(error, "Unknown format: '%s'", format);
      return EINVAL;
  }
}

/* Check that the viewed schema has exactly n_children children (-1 means any
 * count is acceptable) and that each child pointer is non-NULL and not
 * released, so that later inspection cannot segfault. */
static ArrowErrorCode ArrowSchemaViewValidateNChildren(
    struct ArrowSchemaView* schema_view, int64_t n_children, struct ArrowError* error) {
  if (n_children != -1 && schema_view->schema->n_children != n_children) {
    ArrowErrorSet(
        error, "Expected schema with %" PRId64 " children but found %" PRId64 " children",
        n_children, schema_view->schema->n_children);
    return EINVAL;
  }

  // Don't do a full validation of children but do check that they won't
  // segfault if inspected
  struct ArrowSchema* child;
  for (int64_t i = 0; i < schema_view->schema->n_children; i++) {
    child = schema_view->schema->children[i];
    if (child == NULL) {
      ArrowErrorSet(
          error, "Expected valid schema at schema->children[%" PRId64 "] but found NULL",
          i);
      return EINVAL;
    } else if (child->release == NULL) {
      ArrowErrorSet(error,
                    "Expected valid schema at schema->children[%" PRId64
                    "] but found a released schema",
                    i);
      return EINVAL;
    }
  }

  return NANOARROW_OK;
}

/* Validate a union schema: children are checked for basic sanity only. */
static ArrowErrorCode ArrowSchemaViewValidateUnion(struct ArrowSchemaView* schema_view,
                                                   struct ArrowError* error) {
  return ArrowSchemaViewValidateNChildren(schema_view, -1, error);
}

/* Validate the fixed structure of a map schema: one non-nullable "+s" child
 * ("entries") with exactly two children, the first of which (the key) must be
 * non-nullable. */
static ArrowErrorCode ArrowSchemaViewValidateMap(struct ArrowSchemaView* schema_view,
                                                 struct ArrowError* error) {
  NANOARROW_RETURN_NOT_OK(ArrowSchemaViewValidateNChildren(schema_view, 1, error));

  if (schema_view->schema->children[0]->n_children != 2) {
    ArrowErrorSet(error, "Expected child of map type to have 2 children but found %" PRId64,
                  schema_view->schema->children[0]->n_children);
    return EINVAL;
  }

  if (strcmp(schema_view->schema->children[0]->format, "+s") != 0) {
    ArrowErrorSet(error, "Expected format of child of map type to be '+s' but found '%s'",
                  schema_view->schema->children[0]->format);
    return EINVAL;
  }

  if (schema_view->schema->children[0]->flags & ARROW_FLAG_NULLABLE) {
    ArrowErrorSet(error,
                  "Expected child of map type to be non-nullable but was nullable");
    return EINVAL;
  }

  if (schema_view->schema->children[0]->children[0]->flags & ARROW_FLAG_NULLABLE) {
    ArrowErrorSet(error, "Expected key of map type to be non-nullable but was nullable");
    return EINVAL;
  }

  return NANOARROW_OK;
}

/* Validate a dictionary schema: the storage type must be an integral index
 * type, and the dictionary schema itself must parse as a valid view. */
static ArrowErrorCode ArrowSchemaViewValidateDictionary(
    struct ArrowSchemaView* schema_view, struct ArrowError* error) {
  // check for valid index type
  switch (schema_view->storage_type) {
    case NANOARROW_TYPE_UINT8:
    case NANOARROW_TYPE_INT8:
    case NANOARROW_TYPE_UINT16:
    case NANOARROW_TYPE_INT16:
    case NANOARROW_TYPE_UINT32:
    case NANOARROW_TYPE_INT32:
    case NANOARROW_TYPE_UINT64:
    case NANOARROW_TYPE_INT64:
      break;
    default:
      ArrowErrorSet(
          error,
          "Expected dictionary schema index type to be an integral type but found '%s'",
          schema_view->schema->format);
      return EINVAL;
  }

  struct ArrowSchemaView dictionary_schema_view;
  return ArrowSchemaViewInit(&dictionary_schema_view, schema_view->schema->dictionary,
                             error);
}

/* Dispatch type-specific validation (child counts, fixed sizes, union/map/
 * dictionary structure) for the given logical or storage type. */
static ArrowErrorCode ArrowSchemaViewValidate(struct ArrowSchemaView* schema_view,
                                              enum ArrowType type,
                                              struct ArrowError* error) {
  switch (type) {
    case NANOARROW_TYPE_NA:
    case
        /* Primitive, decimal, variable-size binary/string, date/time, and
         * view types carry no children. */
        NANOARROW_TYPE_BOOL:
    case NANOARROW_TYPE_UINT8:
    case NANOARROW_TYPE_INT8:
    case NANOARROW_TYPE_UINT16:
    case NANOARROW_TYPE_INT16:
    case NANOARROW_TYPE_UINT32:
    case NANOARROW_TYPE_INT32:
    case NANOARROW_TYPE_UINT64:
    case NANOARROW_TYPE_INT64:
    case NANOARROW_TYPE_HALF_FLOAT:
    case NANOARROW_TYPE_FLOAT:
    case NANOARROW_TYPE_DOUBLE:
    case NANOARROW_TYPE_DECIMAL32:
    case NANOARROW_TYPE_DECIMAL64:
    case NANOARROW_TYPE_DECIMAL128:
    case NANOARROW_TYPE_DECIMAL256:
    case NANOARROW_TYPE_STRING:
    case NANOARROW_TYPE_LARGE_STRING:
    case NANOARROW_TYPE_BINARY:
    case NANOARROW_TYPE_LARGE_BINARY:
    case NANOARROW_TYPE_DATE32:
    case NANOARROW_TYPE_DATE64:
    case NANOARROW_TYPE_INTERVAL_MONTHS:
    case NANOARROW_TYPE_INTERVAL_DAY_TIME:
    case NANOARROW_TYPE_INTERVAL_MONTH_DAY_NANO:
    case NANOARROW_TYPE_TIMESTAMP:
    case NANOARROW_TYPE_TIME32:
    case NANOARROW_TYPE_TIME64:
    case NANOARROW_TYPE_DURATION:
    case NANOARROW_TYPE_BINARY_VIEW:
    case NANOARROW_TYPE_STRING_VIEW:
      return ArrowSchemaViewValidateNChildren(schema_view, 0, error);

    case NANOARROW_TYPE_FIXED_SIZE_BINARY:
      if (schema_view->fixed_size <= 0) {
        ArrowErrorSet(error, "Expected size > 0 for fixed size binary but found size %d",
                      schema_view->fixed_size);
        return EINVAL;
      }
      return ArrowSchemaViewValidateNChildren(schema_view, 0, error);

    /* All list flavors carry exactly one child (the element type). */
    case NANOARROW_TYPE_LIST:
    case NANOARROW_TYPE_LIST_VIEW:
    case NANOARROW_TYPE_LARGE_LIST:
    case NANOARROW_TYPE_LARGE_LIST_VIEW:
    case NANOARROW_TYPE_FIXED_SIZE_LIST:
      return ArrowSchemaViewValidateNChildren(schema_view, 1, error);

    /* Run-end encoded carries run_ends + values. */
    case NANOARROW_TYPE_RUN_END_ENCODED:
      return ArrowSchemaViewValidateNChildren(schema_view, 2, error);

    case NANOARROW_TYPE_STRUCT:
      return ArrowSchemaViewValidateNChildren(schema_view, -1, error);

    case NANOARROW_TYPE_SPARSE_UNION:
    case NANOARROW_TYPE_DENSE_UNION:
      return ArrowSchemaViewValidateUnion(schema_view, error);

    case NANOARROW_TYPE_MAP:
      return ArrowSchemaViewValidateMap(schema_view, error);

    case NANOARROW_TYPE_DICTIONARY:
      return ArrowSchemaViewValidateDictionary(schema_view, error);

    default:
      ArrowErrorSet(error, "Expected a valid enum ArrowType value but found %d",
                    schema_view->type);
      return EINVAL;
  }

  return NANOARROW_OK;
}

/* Populate schema_view by parsing and validating schema: checks for NULL and
 * released schemas, parses the format string, validates structure and flags,
 * initializes the buffer layout, and extracts extension metadata. */
ArrowErrorCode ArrowSchemaViewInit(struct ArrowSchemaView* schema_view,
                                   const struct ArrowSchema* schema,
                                   struct ArrowError* error) {
  if (schema == NULL) {
    ArrowErrorSet(error, "Expected non-NULL schema");
    return EINVAL;
  }

  if (schema->release == NULL) {
    ArrowErrorSet(error, "Expected non-released schema");
    return EINVAL;
  }

  schema_view->schema = schema;

  const char* format = schema->format;
  if (format == NULL) {
    ArrowErrorSet(
        error,
        "Error parsing schema->format: Expected a null-terminated string but found NULL");
    return EINVAL;
  }

  size_t format_len = strlen(format);
  if (format_len == 0) {
    ArrowErrorSet(error, "Error parsing schema->format: Expected a string with size > 0");
    return EINVAL;
  }

  const char* format_end_out;
  int result = ArrowSchemaViewParse(schema_view, format, &format_end_out, error);

  if (result != NANOARROW_OK) {
    if (error != NULL) {
      /* Copy the parse error aside so it can be wrapped with context. */
      char child_error[1024];
      memcpy(child_error, ArrowErrorMessage(error), 1024);
      ArrowErrorSet(error, "Error parsing schema->format: %s", child_error);
    }

    return result;
  }

  /* The whole format string must have been consumed. */
  if ((format + format_len) != format_end_out) {
    ArrowErrorSet(error, "Error parsing schema->format '%s': parsed %d/%zu characters",
                  format, (int)(format_end_out - format), format_len);
    return EINVAL;
  }

  /* A dictionary member overrides the parsed logical type. */
  if (schema->dictionary != NULL) {
    schema_view->type = NANOARROW_TYPE_DICTIONARY;
  }

  NANOARROW_RETURN_NOT_OK(
      ArrowSchemaViewValidate(schema_view, schema_view->storage_type, error));

  if (schema_view->storage_type != schema_view->type) {
    NANOARROW_RETURN_NOT_OK(
        ArrowSchemaViewValidate(schema_view, schema_view->type, error));
  }

  int64_t unknown_flags = schema->flags & ~NANOARROW_FLAG_ALL_SUPPORTED;
  if (unknown_flags != 0) {
    ArrowErrorSet(error, "Unknown ArrowSchema flag");
    return EINVAL;
  }

  if (schema->flags & ARROW_FLAG_DICTIONARY_ORDERED &&
      schema_view->type != NANOARROW_TYPE_DICTIONARY) {
    ArrowErrorSet(error,
                  "ARROW_FLAG_DICTIONARY_ORDERED is only relevant for dictionaries");
    return EINVAL;
  }

  if (schema->flags & ARROW_FLAG_MAP_KEYS_SORTED &&
      schema_view->type != NANOARROW_TYPE_MAP) {
    ArrowErrorSet(error, "ARROW_FLAG_MAP_KEYS_SORTED is only relevant for a map type");
    return EINVAL;
  }

  ArrowLayoutInit(&schema_view->layout, schema_view->storage_type);
  if (schema_view->storage_type == NANOARROW_TYPE_FIXED_SIZE_BINARY) {
    /* Data buffer element width in bits is the fixed byte size * 8. */
    schema_view->layout.element_size_bits[1] = (int64_t)schema_view->fixed_size * 8;
  } else if (schema_view->storage_type == NANOARROW_TYPE_FIXED_SIZE_LIST) {
    schema_view->layout.child_size_elements = schema_view->fixed_size;
  }

  /* Extension name/metadata default to a NULL view when absent. */
  schema_view->extension_name = ArrowCharView(NULL);
  schema_view->extension_metadata = ArrowCharView(NULL);
  NANOARROW_RETURN_NOT_OK(ArrowMetadataGetValue(schema->metadata,
                                                ArrowCharView("ARROW:extension:name"),
                                                &schema_view->extension_name));
  NANOARROW_RETURN_NOT_OK(ArrowMetadataGetValue(schema->metadata,
                                                ArrowCharView("ARROW:extension:metadata"),
                                                &schema_view->extension_metadata));

  return NANOARROW_OK;
}

/* snprintf a human-readable rendering of the view's type (with parameters for
 * decimal, timestamp, time, fixed-size, and union types) into out, returning
 * the snprintf result. */
static int64_t ArrowSchemaTypeToStringInternal(struct ArrowSchemaView* schema_view,
                                               char* out, int64_t n) {
  const char* type_string = ArrowTypeString(schema_view->type);
  switch (schema_view->type) {
    case NANOARROW_TYPE_DECIMAL32:
    case NANOARROW_TYPE_DECIMAL64:
    case NANOARROW_TYPE_DECIMAL128:
    case NANOARROW_TYPE_DECIMAL256:
      return snprintf(out, n, "%s(%" PRId32 ", %" PRId32 ")", type_string,
                      schema_view->decimal_precision, schema_view->decimal_scale);
    case NANOARROW_TYPE_TIMESTAMP:
      return snprintf(out, n, "%s('%s', '%s')", type_string,
                      ArrowTimeUnitString(schema_view->time_unit), schema_view->timezone);
    case NANOARROW_TYPE_TIME32:
    case NANOARROW_TYPE_TIME64:
    case NANOARROW_TYPE_DURATION:
      return snprintf(out, n, "%s('%s')", type_string,
                      ArrowTimeUnitString(schema_view->time_unit));
    case NANOARROW_TYPE_FIXED_SIZE_BINARY:
    case NANOARROW_TYPE_FIXED_SIZE_LIST:
      return snprintf(out, n, "%s(%" PRId32 ")", type_string, schema_view->fixed_size);
    case
        NANOARROW_TYPE_SPARSE_UNION:
    case NANOARROW_TYPE_DENSE_UNION:
      return snprintf(out, n, "%s([%s])", type_string, schema_view->union_type_ids);
    default:
      return snprintf(out, n, "%s", type_string);
  }
}

// Helper for bookkeeping to emulate sprintf()-like behaviour spread
// among multiple sprintf calls.
static inline void ArrowToStringLogChars(char** out, int64_t n_chars_last,
                                         int64_t* n_remaining, int64_t* n_chars) {
  // In the unlikely snprintf() returning a negative value (encoding error),
  // ensure the result won't cause an out-of-bounds access.
  if (n_chars_last < 0) {
    n_chars_last = 0;
  }

  *n_chars += n_chars_last;
  *n_remaining -= n_chars_last;

  // n_remaining is never less than 0
  if (*n_remaining < 0) {
    *n_remaining = 0;
  }

  // Can't do math on a NULL pointer
  if (*out != NULL) {
    *out += n_chars_last;
  }
}

/* Render schema into out (at most n bytes), optionally recursing into
 * children. Returns the number of characters that would have been written,
 * snprintf-style; invalid schemas render as "[invalid: ...]". */
int64_t ArrowSchemaToString(const struct ArrowSchema* schema, char* out, int64_t n,
                            char recursive) {
  if (schema == NULL) {
    return snprintf(out, n, "[invalid: pointer is null]");
  }

  if (schema->release == NULL) {
    return snprintf(out, n, "[invalid: schema is released]");
  }

  struct ArrowSchemaView schema_view;
  struct ArrowError error;

  if (ArrowSchemaViewInit(&schema_view, schema, &error) != NANOARROW_OK) {
    return snprintf(out, n, "[invalid: %s]", ArrowErrorMessage(&error));
  }

  // Extension type and dictionary should include both the top-level type
  // and the storage type.
  int is_extension = schema_view.extension_name.size_bytes > 0;
  int is_dictionary = schema->dictionary != NULL;
  int64_t n_chars = 0;
  int64_t n_chars_last = 0;

  // Uncommon but not technically impossible that both are true
  if (is_extension && is_dictionary) {
    n_chars_last = snprintf(
        out, n, "%.*s{dictionary(%s)<", (int)schema_view.extension_name.size_bytes,
        schema_view.extension_name.data, ArrowTypeString(schema_view.storage_type));
  } else if (is_extension) {
    n_chars_last = snprintf(out, n, "%.*s{", (int)schema_view.extension_name.size_bytes,
                            schema_view.extension_name.data);
  } else if (is_dictionary) {
    n_chars_last =
        snprintf(out, n, "dictionary(%s)<", ArrowTypeString(schema_view.storage_type));
  }

  ArrowToStringLogChars(&out, n_chars_last, &n, &n_chars);

  /* Dictionaries render their value schema recursively; everything else
   * renders the (possibly parameterized) type name. */
  if (!is_dictionary) {
    n_chars_last = ArrowSchemaTypeToStringInternal(&schema_view, out, n);
  } else {
    n_chars_last = ArrowSchemaToString(schema->dictionary, out, n, recursive);
  }

  ArrowToStringLogChars(&out, n_chars_last, &n, &n_chars);

  /* Nested types (format starts with '+') list their children in <...>. */
  if (recursive && schema->format[0] == '+') {
    n_chars_last = snprintf(out, n, "<");
    ArrowToStringLogChars(&out, n_chars_last, &n, &n_chars);

    for (int64_t i = 0; i < schema->n_children; i++) {
      if (i > 0) {
        n_chars_last = snprintf(out, n, ", ");
        ArrowToStringLogChars(&out, n_chars_last, &n, &n_chars);
      }

      // ArrowSchemaToStringInternal() will validate the child and print the error,
      // but we need the name first
      if (schema->children[i] != NULL && schema->children[i]->release != NULL &&
          schema->children[i]->name != NULL) {
        n_chars_last = snprintf(out, n, "%s: ", schema->children[i]->name);
        ArrowToStringLogChars(&out, n_chars_last, &n, &n_chars);
      }

      n_chars_last = ArrowSchemaToString(schema->children[i], out, n, recursive);
      ArrowToStringLogChars(&out, n_chars_last, &n, &n_chars);
    }

    n_chars_last = snprintf(out, n, ">");
    ArrowToStringLogChars(&out, n_chars_last, &n, &n_chars);
  }

  /* Close the wrappers opened above. */
  if (is_extension && is_dictionary) {
    n_chars += snprintf(out, n, ">}");
  } else if (is_extension) {
    n_chars +=
        snprintf(out, n, "}");
  } else if (is_dictionary) {
    n_chars += snprintf(out, n, ">");
  }

  // Ensure that we always return a positive result
  if (n_chars > 0) {
    return n_chars;
  } else {
    return 0;
  }
}

/* Initialize a reader over the Arrow KV-metadata encoding: an int32 key
 * count followed by (int32 key_len, key, int32 value_len, value) records.
 * NULL metadata yields a reader with zero remaining keys. */
ArrowErrorCode ArrowMetadataReaderInit(struct ArrowMetadataReader* reader,
                                       const char* metadata) {
  reader->metadata = metadata;

  if (reader->metadata == NULL) {
    reader->offset = 0;
    reader->remaining_keys = 0;
  } else {
    /* memcpy avoids unaligned reads on the serialized int32. */
    memcpy(&reader->remaining_keys, reader->metadata, sizeof(int32_t));
    reader->offset = sizeof(int32_t);
  }

  return NANOARROW_OK;
}

/* Read the next key/value pair as views into the metadata buffer; returns
 * EINVAL when no keys remain. */
ArrowErrorCode ArrowMetadataReaderRead(struct ArrowMetadataReader* reader,
                                       struct ArrowStringView* key_out,
                                       struct ArrowStringView* value_out) {
  if (reader->remaining_keys <= 0) {
    return EINVAL;
  }

  int64_t pos = 0;

  int32_t key_size;
  memcpy(&key_size, reader->metadata + reader->offset + pos, sizeof(int32_t));
  pos += sizeof(int32_t);

  key_out->data = reader->metadata + reader->offset + pos;
  key_out->size_bytes = key_size;
  pos += key_size;

  int32_t value_size;
  memcpy(&value_size, reader->metadata + reader->offset + pos, sizeof(int32_t));
  pos += sizeof(int32_t);

  value_out->data = reader->metadata + reader->offset + pos;
  value_out->size_bytes = value_size;
  pos += value_size;

  reader->offset += pos;
  reader->remaining_keys--;
  return NANOARROW_OK;
}

/* Total serialized size in bytes of a metadata buffer (0 for NULL). */
int64_t ArrowMetadataSizeOf(const char* metadata) {
  if (metadata == NULL) {
    return 0;
  }

  struct ArrowMetadataReader reader;
  struct ArrowStringView key;
  struct ArrowStringView value;
  if (ArrowMetadataReaderInit(&reader, metadata) != NANOARROW_OK) {
    return 0;
  }

  int64_t size = sizeof(int32_t);
  while (ArrowMetadataReaderRead(&reader, &key, &value) == NANOARROW_OK) {
    size += sizeof(int32_t) + key.size_bytes + sizeof(int32_t) + value.size_bytes;
  }

  return size;
}

/* Scan metadata for key, writing the first matching value view to value_out;
 * value_out is left untouched if the key is absent. */
static ArrowErrorCode ArrowMetadataGetValueInternal(const char* metadata,
                                                    struct ArrowStringView* key,
                                                    struct ArrowStringView* value_out) {
  struct ArrowMetadataReader reader;
  struct ArrowStringView existing_key;
  struct ArrowStringView existing_value;
  NANOARROW_RETURN_NOT_OK(ArrowMetadataReaderInit(&reader, metadata));

  while (ArrowMetadataReaderRead(&reader, &existing_key, &existing_value) ==
         NANOARROW_OK) {
    int key_equal = key->size_bytes == existing_key.size_bytes &&
                    strncmp(key->data, existing_key.data, existing_key.size_bytes) == 0;
    if (key_equal) {
      value_out->data = existing_value.data;
      value_out->size_bytes = existing_value.size_bytes;
      break;
    }
  }

  return NANOARROW_OK;
}

/* Public wrapper around ArrowMetadataGetValueInternal with a NULL check. */
ArrowErrorCode ArrowMetadataGetValue(const char* metadata, struct ArrowStringView key,
                                     struct ArrowStringView* value_out) {
  if (value_out == NULL) {
    return EINVAL;
  }

  return ArrowMetadataGetValueInternal(metadata, &key, value_out);
}

/* Return nonzero if key is present in metadata. */
char ArrowMetadataHasKey(const char* metadata, struct ArrowStringView key) {
  struct ArrowStringView value = ArrowCharView(NULL);
  if (ArrowMetadataGetValue(metadata, key, &value) != NANOARROW_OK) {
    return 0;
  }

  return value.data != NULL;
}

/* Initialize buffer as a metadata builder seeded with an existing serialized
 * metadata blob (or empty for NULL). */
ArrowErrorCode ArrowMetadataBuilderInit(struct ArrowBuffer* buffer,
                                        const char* metadata) {
  ArrowBufferInit(buffer);
  return ArrowBufferAppend(buffer, metadata, ArrowMetadataSizeOf(metadata));
}

/* Append one key/value record to a builder buffer and bump the leading key
 * count. A NULL value is a no-op (used by the set/remove paths). */
static ArrowErrorCode ArrowMetadataBuilderAppendInternal(struct ArrowBuffer* buffer,
                                                         struct ArrowStringView* key,
                                                         struct ArrowStringView* value) {
  if (value == NULL) {
    return NANOARROW_OK;
  }

  /* An empty buffer gets its int32 key-count header first. */
  if (buffer->capacity_bytes == 0) {
    NANOARROW_RETURN_NOT_OK(ArrowBufferAppendInt32(buffer, 0));
  }

  if (((size_t)buffer->capacity_bytes) < sizeof(int32_t)) {
    return EINVAL;
  }

  int32_t n_keys;
  memcpy(&n_keys, buffer->data, sizeof(int32_t));

  int32_t key_size = (int32_t)key->size_bytes;
  int32_t value_size = (int32_t)value->size_bytes;
  NANOARROW_RETURN_NOT_OK(ArrowBufferReserve(
      buffer, sizeof(int32_t) + key_size + sizeof(int32_t) + value_size));

  ArrowBufferAppendUnsafe(buffer, &key_size, sizeof(int32_t));
  ArrowBufferAppendUnsafe(buffer, key->data, key_size);
  ArrowBufferAppendUnsafe(buffer, &value_size, sizeof(int32_t));
  ArrowBufferAppendUnsafe(buffer, value->data, value_size);

  n_keys++;
  memcpy(buffer->data,
&n_keys, sizeof(int32_t)); return NANOARROW_OK; } static ArrowErrorCode ArrowMetadataBuilderSetInternal(struct ArrowBuffer* buffer, struct ArrowStringView* key, struct ArrowStringView* value) { // Inspect the current value to see if we can avoid copying the buffer struct ArrowStringView current_value = ArrowCharView(NULL); NANOARROW_RETURN_NOT_OK( ArrowMetadataGetValueInternal((const char*)buffer->data, key, ¤t_value)); // The key should be removed but no key exists if (value == NULL && current_value.data == NULL) { return NANOARROW_OK; } // The key/value can be appended because no key exists if (value != NULL && current_value.data == NULL) { return ArrowMetadataBuilderAppendInternal(buffer, key, value); } struct ArrowMetadataReader reader; struct ArrowStringView existing_key; struct ArrowStringView existing_value; NANOARROW_RETURN_NOT_OK(ArrowMetadataReaderInit(&reader, (const char*)buffer->data)); struct ArrowBuffer new_buffer; NANOARROW_RETURN_NOT_OK(ArrowMetadataBuilderInit(&new_buffer, NULL)); while (reader.remaining_keys > 0) { int result = ArrowMetadataReaderRead(&reader, &existing_key, &existing_value); if (result != NANOARROW_OK) { ArrowBufferReset(&new_buffer); return result; } if (key->size_bytes == existing_key.size_bytes && strncmp((const char*)key->data, (const char*)existing_key.data, existing_key.size_bytes) == 0) { result = ArrowMetadataBuilderAppendInternal(&new_buffer, key, value); value = NULL; } else { result = ArrowMetadataBuilderAppendInternal(&new_buffer, &existing_key, &existing_value); } if (result != NANOARROW_OK) { ArrowBufferReset(&new_buffer); return result; } } ArrowBufferReset(buffer); ArrowBufferMove(&new_buffer, buffer); return NANOARROW_OK; } ArrowErrorCode ArrowMetadataBuilderAppend(struct ArrowBuffer* buffer, struct ArrowStringView key, struct ArrowStringView value) { return ArrowMetadataBuilderAppendInternal(buffer, &key, &value); } ArrowErrorCode ArrowMetadataBuilderSet(struct ArrowBuffer* buffer, struct ArrowStringView key, 
struct ArrowStringView value) { return ArrowMetadataBuilderSetInternal(buffer, &key, &value); } ArrowErrorCode ArrowMetadataBuilderRemove(struct ArrowBuffer* buffer, struct ArrowStringView key) { return ArrowMetadataBuilderSetInternal(buffer, &key, NULL); } // Licensed to the Apache Software Foundation (ASF) under one // or more contributor license agreements. See the NOTICE file // distributed with this work for additional information // regarding copyright ownership. The ASF licenses this file // to you under the Apache License, Version 2.0 (the // "License"); you may not use this file except in compliance // with the License. You may obtain a copy of the License at // // http://www.apache.org/licenses/LICENSE-2.0 // // Unless required by applicable law or agreed to in writing, // software distributed under the License is distributed on an // "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY // KIND, either express or implied. See the License for the // specific language governing permissions and limitations // under the License. #include #include #include #include #include #include #include #include "nanoarrow/nanoarrow.h" static void ArrowArrayReleaseInternal(struct ArrowArray* array) { // Release buffers held by this array struct ArrowArrayPrivateData* private_data = (struct ArrowArrayPrivateData*)array->private_data; if (private_data != NULL) { ArrowBitmapReset(&private_data->bitmap); ArrowBufferReset(&private_data->buffers[0]); ArrowBufferReset(&private_data->buffers[1]); ArrowFree(private_data->buffer_data); for (int32_t i = 0; i < private_data->n_variadic_buffers; ++i) { ArrowBufferReset(&private_data->variadic_buffers[i]); } ArrowFree(private_data->variadic_buffers); ArrowFree(private_data); } // This object owns the memory for all the children, but those // children may have been generated elsewhere and might have // their own release() callback. 
if (array->children != NULL) { for (int64_t i = 0; i < array->n_children; i++) { if (array->children[i] != NULL) { if (array->children[i]->release != NULL) { ArrowArrayRelease(array->children[i]); } ArrowFree(array->children[i]); } } ArrowFree(array->children); } // This object owns the memory for the dictionary but it // may have been generated somewhere else and have its own // release() callback. if (array->dictionary != NULL) { if (array->dictionary->release != NULL) { ArrowArrayRelease(array->dictionary); } ArrowFree(array->dictionary); } // Mark released array->release = NULL; } static int ArrowArrayIsInternal(struct ArrowArray* array) { return array->release == &ArrowArrayReleaseInternal; } static ArrowErrorCode ArrowArraySetStorageType(struct ArrowArray* array, enum ArrowType storage_type) { switch (storage_type) { case NANOARROW_TYPE_UNINITIALIZED: case NANOARROW_TYPE_NA: case NANOARROW_TYPE_RUN_END_ENCODED: array->n_buffers = 0; break; case NANOARROW_TYPE_FIXED_SIZE_LIST: case NANOARROW_TYPE_STRUCT: case NANOARROW_TYPE_SPARSE_UNION: array->n_buffers = 1; break; case NANOARROW_TYPE_LIST: case NANOARROW_TYPE_LARGE_LIST: case NANOARROW_TYPE_MAP: case NANOARROW_TYPE_BOOL: case NANOARROW_TYPE_UINT8: case NANOARROW_TYPE_INT8: case NANOARROW_TYPE_UINT16: case NANOARROW_TYPE_INT16: case NANOARROW_TYPE_UINT32: case NANOARROW_TYPE_INT32: case NANOARROW_TYPE_UINT64: case NANOARROW_TYPE_INT64: case NANOARROW_TYPE_HALF_FLOAT: case NANOARROW_TYPE_FLOAT: case NANOARROW_TYPE_DOUBLE: case NANOARROW_TYPE_DECIMAL32: case NANOARROW_TYPE_DECIMAL64: case NANOARROW_TYPE_DECIMAL128: case NANOARROW_TYPE_DECIMAL256: case NANOARROW_TYPE_INTERVAL_MONTHS: case NANOARROW_TYPE_INTERVAL_DAY_TIME: case NANOARROW_TYPE_INTERVAL_MONTH_DAY_NANO: case NANOARROW_TYPE_FIXED_SIZE_BINARY: case NANOARROW_TYPE_DENSE_UNION: array->n_buffers = 2; break; case NANOARROW_TYPE_BINARY_VIEW: case NANOARROW_TYPE_STRING_VIEW: array->n_buffers = NANOARROW_BINARY_VIEW_FIXED_BUFFERS + 1; break; case 
NANOARROW_TYPE_STRING: case NANOARROW_TYPE_LARGE_STRING: case NANOARROW_TYPE_BINARY: case NANOARROW_TYPE_LARGE_BINARY: case NANOARROW_TYPE_LIST_VIEW: case NANOARROW_TYPE_LARGE_LIST_VIEW: array->n_buffers = 3; break; default: return EINVAL; return NANOARROW_OK; } struct ArrowArrayPrivateData* private_data = (struct ArrowArrayPrivateData*)array->private_data; private_data->storage_type = storage_type; return NANOARROW_OK; } ArrowErrorCode ArrowArrayInitFromType(struct ArrowArray* array, enum ArrowType storage_type) { array->length = 0; array->null_count = 0; array->offset = 0; array->n_buffers = 0; array->n_children = 0; array->buffers = NULL; array->children = NULL; array->dictionary = NULL; array->release = &ArrowArrayReleaseInternal; array->private_data = NULL; struct ArrowArrayPrivateData* private_data = (struct ArrowArrayPrivateData*)ArrowMalloc(sizeof(struct ArrowArrayPrivateData)); if (private_data == NULL) { array->release = NULL; return ENOMEM; } ArrowBitmapInit(&private_data->bitmap); ArrowBufferInit(&private_data->buffers[0]); ArrowBufferInit(&private_data->buffers[1]); private_data->buffer_data = (const void**)ArrowMalloc(sizeof(void*) * NANOARROW_MAX_FIXED_BUFFERS); for (int i = 0; i < NANOARROW_MAX_FIXED_BUFFERS; ++i) { private_data->buffer_data[i] = NULL; } private_data->n_variadic_buffers = 0; private_data->variadic_buffers = NULL; private_data->list_view_offset = 0; array->private_data = private_data; array->buffers = (const void**)(private_data->buffer_data); // These are not technically "storage" in the sense that they do not appear // in the ArrowSchemaView's storage_type member; however, allowing them here // is helpful to maximize the number of types that can avoid going through // ArrowArrayInitFromSchema(). 
switch (storage_type) { case NANOARROW_TYPE_DURATION: case NANOARROW_TYPE_TIMESTAMP: case NANOARROW_TYPE_TIME64: case NANOARROW_TYPE_DATE64: storage_type = NANOARROW_TYPE_INT64; break; case NANOARROW_TYPE_TIME32: case NANOARROW_TYPE_DATE32: storage_type = NANOARROW_TYPE_INT32; break; default: break; } int result = ArrowArraySetStorageType(array, storage_type); if (result != NANOARROW_OK) { ArrowArrayRelease(array); return result; } ArrowLayoutInit(&private_data->layout, storage_type); // We can only know this not to be true when initializing based on a schema // so assume this to be true. private_data->union_type_id_is_child_index = 1; return NANOARROW_OK; } ArrowErrorCode ArrowArrayInitFromArrayView(struct ArrowArray* array, const struct ArrowArrayView* array_view, struct ArrowError* error) { NANOARROW_RETURN_NOT_OK_WITH_ERROR( ArrowArrayInitFromType(array, array_view->storage_type), error); int result; struct ArrowArrayPrivateData* private_data = (struct ArrowArrayPrivateData*)array->private_data; private_data->layout = array_view->layout; if (array_view->n_children > 0) { result = ArrowArrayAllocateChildren(array, array_view->n_children); if (result != NANOARROW_OK) { ArrowArrayRelease(array); return result; } for (int64_t i = 0; i < array_view->n_children; i++) { result = ArrowArrayInitFromArrayView(array->children[i], array_view->children[i], error); if (result != NANOARROW_OK) { ArrowArrayRelease(array); return result; } } } if (array_view->dictionary != NULL) { result = ArrowArrayAllocateDictionary(array); if (result != NANOARROW_OK) { ArrowArrayRelease(array); return result; } result = ArrowArrayInitFromArrayView(array->dictionary, array_view->dictionary, error); if (result != NANOARROW_OK) { ArrowArrayRelease(array); return result; } } return NANOARROW_OK; } ArrowErrorCode ArrowArrayInitFromSchema(struct ArrowArray* array, const struct ArrowSchema* schema, struct ArrowError* error) { struct ArrowArrayView array_view; 
NANOARROW_RETURN_NOT_OK(ArrowArrayViewInitFromSchema(&array_view, schema, error)); NANOARROW_RETURN_NOT_OK(ArrowArrayInitFromArrayView(array, &array_view, error)); if (array_view.storage_type == NANOARROW_TYPE_DENSE_UNION || array_view.storage_type == NANOARROW_TYPE_SPARSE_UNION) { struct ArrowArrayPrivateData* private_data = (struct ArrowArrayPrivateData*)array->private_data; // We can still build arrays if this isn't true; however, the append // functions won't work. Instead, we store this value and error only // when StartAppending is called. private_data->union_type_id_is_child_index = _ArrowUnionTypeIdsWillEqualChildIndices(schema->format + 4, schema->n_children); } ArrowArrayViewReset(&array_view); return NANOARROW_OK; } ArrowErrorCode ArrowArrayAllocateChildren(struct ArrowArray* array, int64_t n_children) { if (array->children != NULL) { return EINVAL; } if (n_children == 0) { return NANOARROW_OK; } array->children = (struct ArrowArray**)ArrowMalloc(n_children * sizeof(struct ArrowArray*)); if (array->children == NULL) { return ENOMEM; } memset(array->children, 0, n_children * sizeof(struct ArrowArray*)); for (int64_t i = 0; i < n_children; i++) { array->children[i] = (struct ArrowArray*)ArrowMalloc(sizeof(struct ArrowArray)); if (array->children[i] == NULL) { return ENOMEM; } array->children[i]->release = NULL; } array->n_children = n_children; return NANOARROW_OK; } ArrowErrorCode ArrowArrayAllocateDictionary(struct ArrowArray* array) { if (array->dictionary != NULL) { return EINVAL; } array->dictionary = (struct ArrowArray*)ArrowMalloc(sizeof(struct ArrowArray)); if (array->dictionary == NULL) { return ENOMEM; } array->dictionary->release = NULL; return NANOARROW_OK; } void ArrowArraySetValidityBitmap(struct ArrowArray* array, struct ArrowBitmap* bitmap) { struct ArrowArrayPrivateData* private_data = (struct ArrowArrayPrivateData*)array->private_data; ArrowBufferMove(&bitmap->buffer, &private_data->bitmap.buffer); private_data->bitmap.size_bits = 
bitmap->size_bits; bitmap->size_bits = 0; private_data->buffer_data[0] = private_data->bitmap.buffer.data; array->null_count = -1; } ArrowErrorCode ArrowArraySetBuffer(struct ArrowArray* array, int64_t i, struct ArrowBuffer* buffer) { struct ArrowArrayPrivateData* private_data = (struct ArrowArrayPrivateData*)array->private_data; if (i >= array->n_buffers || i < 0) { return EINVAL; } // Find the `i`th buffer, release what is currently there, and move the // supplied buffer into that slot. struct ArrowBuffer* dst = ArrowArrayBuffer(array, i); ArrowBufferReset(dst); ArrowBufferMove(buffer, dst); // Flush the pointer into array->buffers. In theory clients should call // ArrowArrayFinishBuilding() to flush the pointer values before passing // this array elsewhere; however, in early nanoarrow versions this was not // needed and some code may depend on this being true. private_data->buffer_data[i] = dst->data; array->buffers = private_data->buffer_data; return NANOARROW_OK; } static ArrowErrorCode ArrowArrayViewInitFromArray(struct ArrowArrayView* array_view, struct ArrowArray* array, struct ArrowError* error) { if (!ArrowArrayIsInternal(array)) { ArrowErrorSet(error, "Can't initialize internal ArrowArrayView from external ArrowArray"); return EINVAL; } struct ArrowArrayPrivateData* private_data = (struct ArrowArrayPrivateData*)array->private_data; ArrowArrayViewInitFromType(array_view, private_data->storage_type); array_view->layout = private_data->layout; array_view->array = array; array_view->length = array->length; array_view->offset = array->offset; array_view->null_count = array->null_count; array_view->buffer_views[0].data.as_uint8 = private_data->bitmap.buffer.data; array_view->buffer_views[0].size_bytes = private_data->bitmap.buffer.size_bytes; array_view->buffer_views[1].data.as_uint8 = private_data->buffers[0].data; array_view->buffer_views[1].size_bytes = private_data->buffers[0].size_bytes; array_view->buffer_views[2].data.as_uint8 = 
private_data->buffers[1].data; array_view->buffer_views[2].size_bytes = private_data->buffers[1].size_bytes; int result = ArrowArrayViewAllocateChildren(array_view, array->n_children); if (result != NANOARROW_OK) { ArrowArrayViewReset(array_view); return result; } for (int64_t i = 0; i < array->n_children; i++) { result = ArrowArrayViewInitFromArray(array_view->children[i], array->children[i], error); if (result != NANOARROW_OK) { ArrowArrayViewReset(array_view); return result; } } if (array->dictionary != NULL) { result = ArrowArrayViewAllocateDictionary(array_view); if (result != NANOARROW_OK) { ArrowArrayViewReset(array_view); return result; } result = ArrowArrayViewInitFromArray(array_view->dictionary, array->dictionary, error); if (result != NANOARROW_OK) { ArrowArrayViewReset(array_view); return result; } } return NANOARROW_OK; } static ArrowErrorCode ArrowArrayReserveInternal(struct ArrowArray* array, struct ArrowArrayView* array_view) { // Loop through buffers and reserve the extra space that we know about for (int64_t i = 0; i < NANOARROW_MAX_FIXED_BUFFERS; i++) { // Don't reserve on a validity buffer that hasn't been allocated yet if (array_view->layout.buffer_type[i] == NANOARROW_BUFFER_TYPE_VALIDITY && ArrowArrayBuffer(array, i)->data == NULL) { continue; } int64_t additional_size_bytes = array_view->buffer_views[i].size_bytes - ArrowArrayBuffer(array, i)->size_bytes; if (additional_size_bytes > 0) { NANOARROW_RETURN_NOT_OK( ArrowBufferReserve(ArrowArrayBuffer(array, i), additional_size_bytes)); } } // Recursively reserve children for (int64_t i = 0; i < array->n_children; i++) { NANOARROW_RETURN_NOT_OK( ArrowArrayReserveInternal(array->children[i], array_view->children[i])); } return NANOARROW_OK; } ArrowErrorCode ArrowArrayReserve(struct ArrowArray* array, int64_t additional_size_elements) { struct ArrowArrayView array_view; NANOARROW_RETURN_NOT_OK(ArrowArrayViewInitFromArray(&array_view, array, NULL)); // Calculate theoretical buffer sizes 
(recursively) ArrowArrayViewSetLength(&array_view, array->length + additional_size_elements); // Walk the structure (recursively) int result = ArrowArrayReserveInternal(array, &array_view); ArrowArrayViewReset(&array_view); if (result != NANOARROW_OK) { return result; } return NANOARROW_OK; } static ArrowErrorCode ArrowArrayFinalizeBuffers(struct ArrowArray* array) { struct ArrowArrayPrivateData* private_data = (struct ArrowArrayPrivateData*)array->private_data; for (int i = 0; i < NANOARROW_MAX_FIXED_BUFFERS; i++) { if (private_data->layout.buffer_type[i] == NANOARROW_BUFFER_TYPE_VALIDITY || private_data->layout.buffer_type[i] == NANOARROW_BUFFER_TYPE_NONE) { continue; } struct ArrowBuffer* buffer = ArrowArrayBuffer(array, i); if (buffer->data == NULL) { NANOARROW_RETURN_NOT_OK((ArrowBufferReserve(buffer, 1))); } } for (int64_t i = 0; i < array->n_children; i++) { if (ArrowArrayIsInternal(array->children[i])) { NANOARROW_RETURN_NOT_OK(ArrowArrayFinalizeBuffers(array->children[i])); } } if (array->dictionary != NULL && ArrowArrayIsInternal(array->dictionary)) { NANOARROW_RETURN_NOT_OK(ArrowArrayFinalizeBuffers(array->dictionary)); } return NANOARROW_OK; } static ArrowErrorCode ArrowArrayFlushInternalPointers(struct ArrowArray* array) { NANOARROW_DCHECK(ArrowArrayIsInternal(array)); struct ArrowArrayPrivateData* private_data = (struct ArrowArrayPrivateData*)array->private_data; if (array->n_buffers > NANOARROW_MAX_FIXED_BUFFERS) { // If the variadic sizes buffer was not set and there is at least one variadic // buffer, populate it now (if there are no variadic buffers there will be exactly // three total buffers and we don't need to do anything special here). Notably, this // will occur when building a BinaryView/StringView array by element using the // appender. 
struct ArrowBuffer* sizes_buffer = ArrowArrayBuffer(array, array->n_buffers - 1); if (sizes_buffer->data == NULL && sizes_buffer->size_bytes == 0) { NANOARROW_RETURN_NOT_OK( ArrowBufferReserve(sizes_buffer, private_data->n_variadic_buffers)); for (int64_t i = 0; i < private_data->n_variadic_buffers; i++) { struct ArrowBuffer* variadic_buffer = ArrowArrayBuffer(array, i + NANOARROW_BINARY_VIEW_FIXED_BUFFERS); NANOARROW_RETURN_NOT_OK( ArrowBufferAppendInt64(sizes_buffer, variadic_buffer->size_bytes)); } } } for (int32_t i = 0; i < array->n_buffers; i++) { private_data->buffer_data[i] = ArrowArrayBuffer(array, i)->data; } array->buffers = (const void**)(private_data->buffer_data); // Flush internal pointers for child/dictionary arrays if we allocated them. Clients // building arrays by buffer might have moved arrays from some other source (e.g., // to create a record batch) and calling this function in that case will cause a crash. for (int64_t i = 0; i < array->n_children; i++) { if (ArrowArrayIsInternal(array->children[i])) { NANOARROW_RETURN_NOT_OK(ArrowArrayFlushInternalPointers(array->children[i])); } } if (array->dictionary != NULL && ArrowArrayIsInternal(array->dictionary)) { NANOARROW_RETURN_NOT_OK(ArrowArrayFlushInternalPointers(array->dictionary)); } return NANOARROW_OK; } ArrowErrorCode ArrowArrayFinishBuilding(struct ArrowArray* array, enum ArrowValidationLevel validation_level, struct ArrowError* error) { // Even if the data buffer is size zero, the pointer value needed to be non-null // in some implementations (at least one version of Arrow C++ at the time this // was added and C# as later discovered). Only do this fix if we can assume // CPU data access. 
if (validation_level >= NANOARROW_VALIDATION_LEVEL_DEFAULT) { NANOARROW_RETURN_NOT_OK_WITH_ERROR(ArrowArrayFinalizeBuffers(array), error); } // Make sure the value we get with array->buffers[i] is set to the actual // pointer (which may have changed from the original due to reallocation) NANOARROW_RETURN_NOT_OK_WITH_ERROR(ArrowArrayFlushInternalPointers(array), error); if (validation_level == NANOARROW_VALIDATION_LEVEL_NONE) { return NANOARROW_OK; } // For validation, initialize an ArrowArrayView with our known buffer sizes struct ArrowArrayView array_view; NANOARROW_RETURN_NOT_OK_WITH_ERROR( ArrowArrayViewInitFromArray(&array_view, array, error), error); int result = ArrowArrayViewValidate(&array_view, validation_level, error); ArrowArrayViewReset(&array_view); return result; } ArrowErrorCode ArrowArrayFinishBuildingDefault(struct ArrowArray* array, struct ArrowError* error) { return ArrowArrayFinishBuilding(array, NANOARROW_VALIDATION_LEVEL_DEFAULT, error); } void ArrowArrayViewInitFromType(struct ArrowArrayView* array_view, enum ArrowType storage_type) { memset(array_view, 0, sizeof(struct ArrowArrayView)); array_view->storage_type = storage_type; ArrowLayoutInit(&array_view->layout, storage_type); } ArrowErrorCode ArrowArrayViewAllocateChildren(struct ArrowArrayView* array_view, int64_t n_children) { if (array_view->children != NULL) { return EINVAL; } if (n_children == 0) { array_view->n_children = 0; return NANOARROW_OK; } array_view->children = (struct ArrowArrayView**)ArrowMalloc(n_children * sizeof(struct ArrowArrayView*)); if (array_view->children == NULL) { return ENOMEM; } for (int64_t i = 0; i < n_children; i++) { array_view->children[i] = NULL; } array_view->n_children = n_children; for (int64_t i = 0; i < n_children; i++) { array_view->children[i] = (struct ArrowArrayView*)ArrowMalloc(sizeof(struct ArrowArrayView)); if (array_view->children[i] == NULL) { return ENOMEM; } ArrowArrayViewInitFromType(array_view->children[i], 
NANOARROW_TYPE_UNINITIALIZED); } return NANOARROW_OK; } ArrowErrorCode ArrowArrayViewAllocateDictionary(struct ArrowArrayView* array_view) { if (array_view->dictionary != NULL) { return EINVAL; } array_view->dictionary = (struct ArrowArrayView*)ArrowMalloc(sizeof(struct ArrowArrayView)); if (array_view->dictionary == NULL) { return ENOMEM; } ArrowArrayViewInitFromType(array_view->dictionary, NANOARROW_TYPE_UNINITIALIZED); return NANOARROW_OK; } ArrowErrorCode ArrowArrayViewInitFromSchema(struct ArrowArrayView* array_view, const struct ArrowSchema* schema, struct ArrowError* error) { struct ArrowSchemaView schema_view; int result = ArrowSchemaViewInit(&schema_view, schema, error); if (result != NANOARROW_OK) { return result; } ArrowArrayViewInitFromType(array_view, schema_view.storage_type); array_view->layout = schema_view.layout; result = ArrowArrayViewAllocateChildren(array_view, schema->n_children); if (result != NANOARROW_OK) { ArrowErrorSet(error, "ArrowArrayViewAllocateChildren() failed"); ArrowArrayViewReset(array_view); return result; } for (int64_t i = 0; i < schema->n_children; i++) { result = ArrowArrayViewInitFromSchema(array_view->children[i], schema->children[i], error); if (result != NANOARROW_OK) { ArrowArrayViewReset(array_view); return result; } } if (schema->dictionary != NULL) { result = ArrowArrayViewAllocateDictionary(array_view); if (result != NANOARROW_OK) { ArrowArrayViewReset(array_view); return result; } result = ArrowArrayViewInitFromSchema(array_view->dictionary, schema->dictionary, error); if (result != NANOARROW_OK) { ArrowArrayViewReset(array_view); return result; } } if (array_view->storage_type == NANOARROW_TYPE_SPARSE_UNION || array_view->storage_type == NANOARROW_TYPE_DENSE_UNION) { array_view->union_type_id_map = (int8_t*)ArrowMalloc(256 * sizeof(int8_t)); if (array_view->union_type_id_map == NULL) { return ENOMEM; } memset(array_view->union_type_id_map, -1, 256); int32_t n_type_ids = 
_ArrowParseUnionTypeIds(schema_view.union_type_ids, array_view->union_type_id_map + 128); for (int8_t child_index = 0; child_index < n_type_ids; child_index++) { int8_t type_id = array_view->union_type_id_map[128 + child_index]; array_view->union_type_id_map[type_id] = child_index; } } return NANOARROW_OK; } void ArrowArrayViewReset(struct ArrowArrayView* array_view) { if (array_view->children != NULL) { for (int64_t i = 0; i < array_view->n_children; i++) { if (array_view->children[i] != NULL) { ArrowArrayViewReset(array_view->children[i]); ArrowFree(array_view->children[i]); } } ArrowFree(array_view->children); } if (array_view->dictionary != NULL) { ArrowArrayViewReset(array_view->dictionary); ArrowFree(array_view->dictionary); } if (array_view->union_type_id_map != NULL) { ArrowFree(array_view->union_type_id_map); } ArrowArrayViewInitFromType(array_view, NANOARROW_TYPE_UNINITIALIZED); } void ArrowArrayViewSetLength(struct ArrowArrayView* array_view, int64_t length) { for (int i = 0; i < NANOARROW_MAX_FIXED_BUFFERS; i++) { int64_t element_size_bytes = array_view->layout.element_size_bits[i] / 8; switch (array_view->layout.buffer_type[i]) { case NANOARROW_BUFFER_TYPE_VALIDITY: array_view->buffer_views[i].size_bytes = _ArrowBytesForBits(length); continue; case NANOARROW_BUFFER_TYPE_DATA_OFFSET: // Probably don't want/need to rely on the producer to have allocated an // offsets buffer of length 1 for a zero-size array array_view->buffer_views[i].size_bytes = (length != 0) * element_size_bytes * (length + 1); continue; case NANOARROW_BUFFER_TYPE_DATA: array_view->buffer_views[i].size_bytes = _ArrowRoundUpToMultipleOf8(array_view->layout.element_size_bits[i] * length) / 8; continue; case NANOARROW_BUFFER_TYPE_TYPE_ID: case NANOARROW_BUFFER_TYPE_UNION_OFFSET: case NANOARROW_BUFFER_TYPE_VIEW_OFFSET: case NANOARROW_BUFFER_TYPE_SIZE: array_view->buffer_views[i].size_bytes = element_size_bytes * length; continue; case NANOARROW_BUFFER_TYPE_VARIADIC_DATA: case 
NANOARROW_BUFFER_TYPE_VARIADIC_SIZE: case NANOARROW_BUFFER_TYPE_NONE: array_view->buffer_views[i].size_bytes = 0; continue; } } switch (array_view->storage_type) { case NANOARROW_TYPE_STRUCT: case NANOARROW_TYPE_SPARSE_UNION: for (int64_t i = 0; i < array_view->n_children; i++) { ArrowArrayViewSetLength(array_view->children[i], length); } break; case NANOARROW_TYPE_FIXED_SIZE_LIST: if (array_view->n_children >= 1) { ArrowArrayViewSetLength(array_view->children[0], length * array_view->layout.child_size_elements); } default: break; } } // This version recursively extracts information from the array and stores it // in the array view, performing any checks that require the original array. static int ArrowArrayViewSetArrayInternal(struct ArrowArrayView* array_view, const struct ArrowArray* array, struct ArrowError* error) { array_view->array = array; array_view->offset = array->offset; array_view->length = array->length; array_view->null_count = array->null_count; array_view->variadic_buffer_sizes = NULL; array_view->variadic_buffers = NULL; array_view->n_variadic_buffers = 0; int64_t buffers_required = 0; const int nfixed_buf = array_view->storage_type == NANOARROW_TYPE_STRING_VIEW || array_view->storage_type == NANOARROW_TYPE_BINARY_VIEW ? NANOARROW_BINARY_VIEW_FIXED_BUFFERS : NANOARROW_MAX_FIXED_BUFFERS; for (int i = 0; i < nfixed_buf; i++) { if (array_view->layout.buffer_type[i] == NANOARROW_BUFFER_TYPE_NONE) { break; } buffers_required++; // Set buffer pointer array_view->buffer_views[i].data.data = array->buffers[i]; // If non-null, set buffer size to unknown. 
if (array->buffers[i] == NULL) { array_view->buffer_views[i].size_bytes = 0; } else { array_view->buffer_views[i].size_bytes = -1; } } if (array_view->storage_type == NANOARROW_TYPE_STRING_VIEW || array_view->storage_type == NANOARROW_TYPE_BINARY_VIEW) { const int64_t n_buffers = array->n_buffers; const int32_t nfixed_buf = NANOARROW_BINARY_VIEW_FIXED_BUFFERS; const int32_t nvariadic_buf = (int32_t)(n_buffers - nfixed_buf - 1); array_view->n_variadic_buffers = nvariadic_buf; buffers_required += nvariadic_buf + 1; array_view->variadic_buffers = array->buffers + NANOARROW_BINARY_VIEW_FIXED_BUFFERS; array_view->variadic_buffer_sizes = (int64_t*)array->buffers[n_buffers - 1]; } if (buffers_required != array->n_buffers) { ArrowErrorSet(error, "Expected array with %" PRId64 " buffer(s) but found %" PRId64 " buffer(s)", buffers_required, array->n_buffers); return EINVAL; } // Check number of children if (array_view->n_children != array->n_children) { ArrowErrorSet(error, "Expected %" PRId64 " children but found %" PRId64 " children", array_view->n_children, array->n_children); return EINVAL; } // Recurse for children for (int64_t i = 0; i < array_view->n_children; i++) { NANOARROW_RETURN_NOT_OK(ArrowArrayViewSetArrayInternal(array_view->children[i], array->children[i], error)); } // Check dictionary if (array->dictionary == NULL && array_view->dictionary != NULL) { ArrowErrorSet(error, "Expected dictionary but found NULL"); return EINVAL; } if (array->dictionary != NULL && array_view->dictionary == NULL) { ArrowErrorSet(error, "Expected NULL dictionary but found dictionary member"); return EINVAL; } if (array->dictionary != NULL) { NANOARROW_RETURN_NOT_OK( ArrowArrayViewSetArrayInternal(array_view->dictionary, array->dictionary, error)); } return NANOARROW_OK; } static int ArrowArrayViewValidateMinimal(struct ArrowArrayView* array_view, struct ArrowError* error) { if (array_view->length < 0) { ArrowErrorSet(error, "Expected length >= 0 but found length %" PRId64, 
array_view->length); return EINVAL; } if (array_view->offset < 0) { ArrowErrorSet(error, "Expected offset >= 0 but found offset %" PRId64, array_view->offset); return EINVAL; } // Ensure that offset + length fits within an int64 before a possible overflow if ((uint64_t)array_view->offset + (uint64_t)array_view->length > (uint64_t)INT64_MAX) { ArrowErrorSet(error, "Offset + length is > INT64_MAX"); return EINVAL; } // Calculate buffer sizes that do not require buffer access. If marked as // unknown, assign the buffer size; otherwise, validate it. int64_t offset_plus_length = array_view->offset + array_view->length; // Only loop over the first two buffers because the size of the third buffer // is always data dependent for all current Arrow types. for (int i = 0; i < 2; i++) { int64_t element_size_bytes = array_view->layout.element_size_bits[i] / 8; // Initialize with a value that will cause an error if accidentally used uninitialized // Need to suppress the clang-tidy warning because gcc warns for possible use int64_t min_buffer_size_bytes = // NOLINT(clang-analyzer-deadcode.DeadStores) array_view->buffer_views[i].size_bytes + 1; switch (array_view->layout.buffer_type[i]) { case NANOARROW_BUFFER_TYPE_VALIDITY: if (array_view->null_count == 0 && array_view->buffer_views[i].size_bytes == 0) { continue; } min_buffer_size_bytes = _ArrowBytesForBits(offset_plus_length); break; case NANOARROW_BUFFER_TYPE_SIZE: min_buffer_size_bytes = element_size_bytes * offset_plus_length; break; case NANOARROW_BUFFER_TYPE_DATA_OFFSET: // Probably don't want/need to rely on the producer to have allocated an // offsets buffer of length 1 for a zero-size array min_buffer_size_bytes = (offset_plus_length != 0) * element_size_bytes * (offset_plus_length + 1); break; case NANOARROW_BUFFER_TYPE_VIEW_OFFSET: min_buffer_size_bytes = (offset_plus_length != 0) * element_size_bytes * offset_plus_length; break; case NANOARROW_BUFFER_TYPE_DATA: min_buffer_size_bytes = 
_ArrowRoundUpToMultipleOf8(array_view->layout.element_size_bits[i] * offset_plus_length) / 8; break; case NANOARROW_BUFFER_TYPE_TYPE_ID: case NANOARROW_BUFFER_TYPE_UNION_OFFSET: min_buffer_size_bytes = element_size_bytes * offset_plus_length; break; case NANOARROW_BUFFER_TYPE_VARIADIC_DATA: case NANOARROW_BUFFER_TYPE_VARIADIC_SIZE: case NANOARROW_BUFFER_TYPE_NONE: continue; } // Assign or validate buffer size if (array_view->buffer_views[i].size_bytes == -1) { array_view->buffer_views[i].size_bytes = min_buffer_size_bytes; } else if (array_view->buffer_views[i].size_bytes < min_buffer_size_bytes) { ArrowErrorSet(error, "Expected %s array buffer %d to have size >= %" PRId64 " bytes but found " "buffer with %" PRId64 " bytes", ArrowTypeString(array_view->storage_type), i, min_buffer_size_bytes, array_view->buffer_views[i].size_bytes); return EINVAL; } } // For list, fixed-size list and map views, we can validate the number of children switch (array_view->storage_type) { case NANOARROW_TYPE_LIST: case NANOARROW_TYPE_LARGE_LIST: case NANOARROW_TYPE_FIXED_SIZE_LIST: case NANOARROW_TYPE_MAP: case NANOARROW_TYPE_LIST_VIEW: case NANOARROW_TYPE_LARGE_LIST_VIEW: if (array_view->n_children != 1) { ArrowErrorSet(error, "Expected 1 child of %s array but found %" PRId64 " child arrays", ArrowTypeString(array_view->storage_type), array_view->n_children); return EINVAL; } break; case NANOARROW_TYPE_RUN_END_ENCODED: if (array_view->n_children != 2) { ArrowErrorSet( error, "Expected 2 children for %s array but found %" PRId64 " child arrays", ArrowTypeString(array_view->storage_type), array_view->n_children); return EINVAL; } break; default: break; } // For struct, the sparse union, and the fixed-size list views, we can validate child // lengths. 
int64_t child_min_length; switch (array_view->storage_type) { case NANOARROW_TYPE_SPARSE_UNION: case NANOARROW_TYPE_STRUCT: child_min_length = (array_view->offset + array_view->length); for (int64_t i = 0; i < array_view->n_children; i++) { if (array_view->children[i]->length < child_min_length) { ArrowErrorSet(error, "Expected struct child %" PRId64 " to have length >= %" PRId64 " but found child with " "length %" PRId64, i + 1, child_min_length, array_view->children[i]->length); return EINVAL; } } break; case NANOARROW_TYPE_FIXED_SIZE_LIST: child_min_length = (array_view->offset + array_view->length) * array_view->layout.child_size_elements; if (array_view->children[0]->length < child_min_length) { ArrowErrorSet(error, "Expected child of fixed_size_list array to have length >= %" PRId64 " but " "found array with length %" PRId64, child_min_length, array_view->children[0]->length); return EINVAL; } break; case NANOARROW_TYPE_RUN_END_ENCODED: { if (array_view->n_children != 2) { ArrowErrorSet(error, "Expected 2 children for run-end encoded array but found %" PRId64, array_view->n_children); return EINVAL; } struct ArrowArrayView* run_ends_view = array_view->children[0]; struct ArrowArrayView* values_view = array_view->children[1]; int64_t max_length; switch (run_ends_view->storage_type) { case NANOARROW_TYPE_INT16: max_length = INT16_MAX; break; case NANOARROW_TYPE_INT32: max_length = INT32_MAX; break; case NANOARROW_TYPE_INT64: max_length = INT64_MAX; break; default: ArrowErrorSet( error, "Run-end encoded array only supports INT16, INT32 or INT64 run-ends " "but found run-ends type %s", ArrowTypeString(run_ends_view->storage_type)); return EINVAL; } // There is already a check above that offset_plus_length < INT64_MAX if (offset_plus_length > max_length) { ArrowErrorSet(error, "Offset + length of a run-end encoded array must fit in a value" " of the run end type %s but is %" PRId64 " + %" PRId64, ArrowTypeString(run_ends_view->storage_type), array_view->offset, 
array_view->length);
        return EINVAL;
      }

      if (run_ends_view->length > values_view->length) {
        ArrowErrorSet(error,
                      "Length of run_ends is greater than the length of values: %" PRId64
                      " > %" PRId64,
                      run_ends_view->length, values_view->length);
        return EINVAL;
      }

      if (run_ends_view->length == 0 && values_view->length != 0) {
        ArrowErrorSet(error,
                      "Run-end encoded array has zero length %" PRId64
                      ", but values array has "
                      "non-zero length",
                      values_view->length);
        return EINVAL;
      }

      // Run ends must be non-nullable
      if (run_ends_view->null_count != 0) {
        ArrowErrorSet(error, "Null count must be 0 for run ends array, but is %" PRId64,
                      run_ends_view->null_count);
        return EINVAL;
      }
      break;
    }
    default:
      break;
  }

  // Recurse for children
  for (int64_t i = 0; i < array_view->n_children; i++) {
    NANOARROW_RETURN_NOT_OK(
        ArrowArrayViewValidateMinimal(array_view->children[i], error));
  }

  // Recurse for dictionary
  if (array_view->dictionary != NULL) {
    NANOARROW_RETURN_NOT_OK(ArrowArrayViewValidateMinimal(array_view->dictionary, error));
  }

  return NANOARROW_OK;
}

// "Default"-level validation: everything ArrowArrayViewValidateMinimal() checks,
// plus checks that require reading the offsets buffer (offset sign checks,
// derived data-buffer sizes, and child lengths implied by the last offset).
static int ArrowArrayViewValidateDefault(struct ArrowArrayView* array_view,
                                         struct ArrowError* error) {
  // Perform minimal validation. This will validate or assign
  // buffer sizes as long as buffer access is not required.
  NANOARROW_RETURN_NOT_OK(ArrowArrayViewValidateMinimal(array_view, error));

  // Calculate buffer sizes or child lengths that require accessing the offsets
  // buffer. Where appropriate, validate that the first offset is >= 0.
  // If a buffer size is marked as unknown, assign it; otherwise, validate it.
  int64_t offset_plus_length = array_view->offset + array_view->length;
  int64_t first_offset;
  int64_t last_offset;
  switch (array_view->storage_type) {
    case NANOARROW_TYPE_STRING:
    case NANOARROW_TYPE_BINARY:
      // 32-bit offsets: the data buffer size is implied by the last offset
      if (array_view->buffer_views[1].size_bytes != 0) {
        first_offset = array_view->buffer_views[1].data.as_int32[array_view->offset];
        if (first_offset < 0) {
          ArrowErrorSet(error, "Expected first offset >= 0 but found %" PRId64,
                        first_offset);
          return EINVAL;
        }

        last_offset = array_view->buffer_views[1].data.as_int32[offset_plus_length];
        if (last_offset < 0) {
          ArrowErrorSet(error, "Expected last offset >= 0 but found %" PRId64,
                        last_offset);
          return EINVAL;
        }

        // If the data buffer size is unknown, assign it; otherwise, check it
        if (array_view->buffer_views[2].size_bytes == -1) {
          array_view->buffer_views[2].size_bytes = last_offset;
        } else if (array_view->buffer_views[2].size_bytes < last_offset) {
          ArrowErrorSet(error,
                        "Expected %s array buffer 2 to have size >= %" PRId64
                        " bytes but found "
                        "buffer with %" PRId64 " bytes",
                        ArrowTypeString(array_view->storage_type), last_offset,
                        array_view->buffer_views[2].size_bytes);
          return EINVAL;
        }
      } else if (array_view->buffer_views[2].size_bytes == -1) {
        // If the data buffer size is unknown and there are no bytes in the offset buffer,
        // set the data buffer size to 0.
        array_view->buffer_views[2].size_bytes = 0;
      }
      break;

    case NANOARROW_TYPE_LARGE_STRING:
    case NANOARROW_TYPE_LARGE_BINARY:
      // Same as the STRING/BINARY case but with 64-bit offsets
      if (array_view->buffer_views[1].size_bytes != 0) {
        first_offset = array_view->buffer_views[1].data.as_int64[array_view->offset];
        if (first_offset < 0) {
          ArrowErrorSet(error, "Expected first offset >= 0 but found %" PRId64,
                        first_offset);
          return EINVAL;
        }

        last_offset = array_view->buffer_views[1].data.as_int64[offset_plus_length];
        if (last_offset < 0) {
          ArrowErrorSet(error, "Expected last offset >= 0 but found %" PRId64,
                        last_offset);
          return EINVAL;
        }

        // If the data buffer size is unknown, assign it; otherwise, check it
        if (array_view->buffer_views[2].size_bytes == -1) {
          array_view->buffer_views[2].size_bytes = last_offset;
        } else if (array_view->buffer_views[2].size_bytes < last_offset) {
          ArrowErrorSet(error,
                        "Expected %s array buffer 2 to have size >= %" PRId64
                        " bytes but found "
                        "buffer with %" PRId64 " bytes",
                        ArrowTypeString(array_view->storage_type), last_offset,
                        array_view->buffer_views[2].size_bytes);
          return EINVAL;
        }
      } else if (array_view->buffer_views[2].size_bytes == -1) {
        // If the data buffer size is unknown and there are no bytes in the offset
        // buffer, set the data buffer size to 0.
        array_view->buffer_views[2].size_bytes = 0;
      }
      break;

    case NANOARROW_TYPE_STRUCT:
      // Every child must cover the parent's logical element range
      for (int64_t i = 0; i < array_view->n_children; i++) {
        if (array_view->children[i]->length < offset_plus_length) {
          ArrowErrorSet(error,
                        "Expected struct child %" PRId64 " to have length >= %" PRId64
                        " but found child with "
                        "length %" PRId64,
                        i + 1, offset_plus_length, array_view->children[i]->length);
          return EINVAL;
        }
      }
      break;

    case NANOARROW_TYPE_LIST:
    case NANOARROW_TYPE_MAP:
      // The child must be long enough to cover the last 32-bit offset
      if (array_view->buffer_views[1].size_bytes != 0) {
        first_offset = array_view->buffer_views[1].data.as_int32[array_view->offset];
        if (first_offset < 0) {
          ArrowErrorSet(error, "Expected first offset >= 0 but found %" PRId64,
                        first_offset);
          return EINVAL;
        }

        last_offset = array_view->buffer_views[1].data.as_int32[offset_plus_length];
        if (last_offset < 0) {
          ArrowErrorSet(error, "Expected last offset >= 0 but found %" PRId64,
                        last_offset);
          return EINVAL;
        }

        if (array_view->children[0]->length < last_offset) {
          ArrowErrorSet(error,
                        "Expected child of %s array to have length >= %" PRId64
                        " but found array with "
                        "length %" PRId64,
                        ArrowTypeString(array_view->storage_type), last_offset,
                        array_view->children[0]->length);
          return EINVAL;
        }
      }
      break;

    case NANOARROW_TYPE_LARGE_LIST:
      // The child must be long enough to cover the last 64-bit offset
      if (array_view->buffer_views[1].size_bytes != 0) {
        first_offset = array_view->buffer_views[1].data.as_int64[array_view->offset];
        if (first_offset < 0) {
          ArrowErrorSet(error, "Expected first offset >= 0 but found %" PRId64,
                        first_offset);
          return EINVAL;
        }

        last_offset = array_view->buffer_views[1].data.as_int64[offset_plus_length];
        if (last_offset < 0) {
          ArrowErrorSet(error, "Expected last offset >= 0 but found %" PRId64,
                        last_offset);
          return EINVAL;
        }

        if (array_view->children[0]->length < last_offset) {
          ArrowErrorSet(error,
                        "Expected child of %s array to have length >= %" PRId64
                        " but found array "
                        "with length %" PRId64,
                        ArrowTypeString(array_view->storage_type), last_offset,
                        array_view->children[0]->length);
          return EINVAL;
        }
      }
      break;

    case NANOARROW_TYPE_RUN_END_ENCODED: {
      struct ArrowArrayView* run_ends_view = array_view->children[0];
      if (run_ends_view->length == 0) {
        break;
      }

      // Run ends must be positive, and the last one must cover offset + length
      int64_t first_run_end = ArrowArrayViewGetIntUnsafe(run_ends_view, 0);
      if (first_run_end < 1) {
        ArrowErrorSet(
            error,
            "All run ends must be greater than 0 but the first run end is %" PRId64,
            first_run_end);
        return EINVAL;
      }

      // offset + length < INT64_MAX is checked in ArrowArrayViewValidateMinimal()
      int64_t last_run_end =
          ArrowArrayViewGetIntUnsafe(run_ends_view, run_ends_view->length - 1);
      if (last_run_end < offset_plus_length) {
        ArrowErrorSet(error,
                      "Last run end is %" PRId64 " but it should be >= (%" PRId64
                      " + %" PRId64 ")",
                      last_run_end, array_view->offset, array_view->length);
        return EINVAL;
      }
      break;
    }
    default:
      break;
  }

  // Recurse for children
  for (int64_t i = 0; i < array_view->n_children; i++) {
    NANOARROW_RETURN_NOT_OK(
        ArrowArrayViewValidateDefault(array_view->children[i], error));
  }

  // Recurse for dictionary
  if (array_view->dictionary != NULL) {
    NANOARROW_RETURN_NOT_OK(ArrowArrayViewValidateDefault(array_view->dictionary, error));
  }

  return NANOARROW_OK;
}

// Populate array_view from array, then run default-level validation
ArrowErrorCode ArrowArrayViewSetArray(struct ArrowArrayView* array_view,
                                      const struct ArrowArray* array,
                                      struct ArrowError* error) {
  // Extract information from the array into the array view
  NANOARROW_RETURN_NOT_OK(ArrowArrayViewSetArrayInternal(array_view, array, error));

  // Run default validation. Because we've marked all non-NULL buffers as having unknown
  // size, validation will also update the buffer sizes as it goes.
  NANOARROW_RETURN_NOT_OK(ArrowArrayViewValidateDefault(array_view, error));

  return NANOARROW_OK;
}

// Populate array_view from array, then run minimal-level validation only
ArrowErrorCode ArrowArrayViewSetArrayMinimal(struct ArrowArrayView* array_view,
                                             const struct ArrowArray* array,
                                             struct ArrowError* error) {
  // Extract information from the array into the array view
  NANOARROW_RETURN_NOT_OK(ArrowArrayViewSetArrayInternal(array_view, array, error));

  // Run minimal validation. Because we've marked all non-NULL buffers as having unknown
  // size, validation will also update the buffer sizes as it goes.
  NANOARROW_RETURN_NOT_OK(ArrowArrayViewValidateMinimal(array_view, error));

  return NANOARROW_OK;
}

// Checks that the int32 elements of view are non-decreasing (offsets buffer).
// NOTE(review): the error message mentions "element size" because a decreasing
// offset pair implies a negative element size.
static int ArrowAssertIncreasingInt32(struct ArrowBufferView view,
                                      struct ArrowError* error) {
  if (view.size_bytes <= (int64_t)sizeof(int32_t)) {
    return NANOARROW_OK;
  }

  for (int64_t i = 1; i < view.size_bytes / (int64_t)sizeof(int32_t); i++) {
    if (view.data.as_int32[i] < view.data.as_int32[i - 1]) {
      ArrowErrorSet(error, "[%" PRId64 "] Expected element size >= 0", i);
      return EINVAL;
    }
  }

  return NANOARROW_OK;
}

// 64-bit variant of ArrowAssertIncreasingInt32()
static int ArrowAssertIncreasingInt64(struct ArrowBufferView view,
                                      struct ArrowError* error) {
  if (view.size_bytes <= (int64_t)sizeof(int64_t)) {
    return NANOARROW_OK;
  }

  for (int64_t i = 1; i < view.size_bytes / (int64_t)sizeof(int64_t); i++) {
    if (view.data.as_int64[i] < view.data.as_int64[i - 1]) {
      ArrowErrorSet(error, "[%" PRId64 "] Expected element size >= 0", i);
      return EINVAL;
    }
  }

  return NANOARROW_OK;
}

// Checks that every int8 element of view lies in [min_value, max_value]
static int ArrowAssertRangeInt8(struct ArrowBufferView view, int8_t min_value,
                                int8_t max_value, struct ArrowError* error) {
  for (int64_t i = 0; i < view.size_bytes; i++) {
    if (view.data.as_int8[i] < min_value || view.data.as_int8[i] > max_value) {
      ArrowErrorSet(error,
                    "[%" PRId64 "] Expected buffer value between %" PRId8 " and %" PRId8
                    " but found value %" PRId8,
                    i, min_value, max_value, view.data.as_int8[i]);
      return EINVAL;
    }
  }

  return NANOARROW_OK;
}

// Checks that every int8 element of view is one of the n_values entries in
// values (linear scan per element; n_values is small: the union child count)
static int ArrowAssertInt8In(struct ArrowBufferView view, const int8_t* values,
                             int64_t n_values, struct ArrowError* error) {
  for (int64_t i = 0; i < view.size_bytes; i++) {
    int item_found = 0;
    for (int64_t j = 0; j < n_values; j++) {
      if (view.data.as_int8[i] == values[j]) {
        item_found = 1;
        break;
      }
    }

    if (!item_found) {
      ArrowErrorSet(error, "[%" PRId64 "] Unexpected buffer value %" PRId8, i,
                    view.data.as_int8[i]);
      return EINVAL;
    }
  }

  return NANOARROW_OK;
}

static int
ArrowArrayViewValidateFull(struct ArrowArrayView* array_view, struct ArrowError* error) { for (int i = 0; i < NANOARROW_MAX_FIXED_BUFFERS; i++) { switch (array_view->layout.buffer_type[i]) { // Only validate the portion of the buffer that is strictly required, // which includes not validating the offset buffer of a zero-length array. case NANOARROW_BUFFER_TYPE_DATA_OFFSET: if (array_view->length == 0) { continue; } if (array_view->layout.element_size_bits[i] == 32) { struct ArrowBufferView sliced_offsets; sliced_offsets.data.as_int32 = array_view->buffer_views[i].data.as_int32 + array_view->offset; sliced_offsets.size_bytes = (array_view->length + 1) * sizeof(int32_t); NANOARROW_RETURN_NOT_OK(ArrowAssertIncreasingInt32(sliced_offsets, error)); } else { struct ArrowBufferView sliced_offsets; sliced_offsets.data.as_int64 = array_view->buffer_views[i].data.as_int64 + array_view->offset; sliced_offsets.size_bytes = (array_view->length + 1) * sizeof(int64_t); NANOARROW_RETURN_NOT_OK(ArrowAssertIncreasingInt64(sliced_offsets, error)); } break; default: break; } } if (array_view->storage_type == NANOARROW_TYPE_DENSE_UNION || array_view->storage_type == NANOARROW_TYPE_SPARSE_UNION) { struct ArrowBufferView sliced_type_ids; sliced_type_ids.size_bytes = array_view->length * sizeof(int8_t); if (array_view->length > 0) { sliced_type_ids.data.as_int8 = array_view->buffer_views[0].data.as_int8 + array_view->offset; } else { sliced_type_ids.data.as_int8 = NULL; } if (array_view->union_type_id_map == NULL) { // If the union_type_id map is NULL (e.g., when using ArrowArrayInitFromType() + // ArrowArrayAllocateChildren() + ArrowArrayFinishBuilding()), we don't have enough // information to validate this buffer. 
ArrowErrorSet(error, "Insufficient information provided for validation of union array"); return EINVAL; } else if (_ArrowParsedUnionTypeIdsWillEqualChildIndices( array_view->union_type_id_map, array_view->n_children, array_view->n_children)) { NANOARROW_RETURN_NOT_OK(ArrowAssertRangeInt8( sliced_type_ids, 0, (int8_t)(array_view->n_children - 1), error)); } else { NANOARROW_RETURN_NOT_OK(ArrowAssertInt8In(sliced_type_ids, array_view->union_type_id_map + 128, array_view->n_children, error)); } } if (array_view->storage_type == NANOARROW_TYPE_DENSE_UNION && array_view->union_type_id_map != NULL) { // Check that offsets refer to child elements that actually exist for (int64_t i = 0; i < array_view->length; i++) { int8_t child_id = ArrowArrayViewUnionChildIndex(array_view, i); int64_t offset = ArrowArrayViewUnionChildOffset(array_view, i); int64_t child_length = array_view->children[child_id]->length; if (offset < 0 || offset > child_length) { ArrowErrorSet(error, "[%" PRId64 "] Expected union offset for child id %" PRId8 " to be between 0 and %" PRId64 " but " "found offset value %" PRId64, i, child_id, child_length, offset); return EINVAL; } } } if (array_view->storage_type == NANOARROW_TYPE_RUN_END_ENCODED) { struct ArrowArrayView* run_ends_view = array_view->children[0]; if (run_ends_view->length > 0) { int64_t last_run_end = ArrowArrayViewGetIntUnsafe(run_ends_view, 0); for (int64_t i = 1; i < run_ends_view->length; i++) { const int64_t run_end = ArrowArrayViewGetIntUnsafe(run_ends_view, i); if (run_end <= last_run_end) { ArrowErrorSet( error, "Every run end must be strictly greater than the previous run end, " "but run_ends[%" PRId64 " is %" PRId64 " and run_ends[%" PRId64 "] is %" PRId64, i, run_end, i - 1, last_run_end); return EINVAL; } last_run_end = run_end; } } } if (array_view->storage_type == NANOARROW_TYPE_LIST_VIEW || array_view->storage_type == NANOARROW_TYPE_LARGE_LIST_VIEW) { int64_t child_len = array_view->children[0]->length; struct ArrowBufferView 
offsets, sizes; offsets.data.data = array_view->buffer_views[1].data.data; sizes.data.data = array_view->buffer_views[2].data.data; for (int64_t i = array_view->offset; i < array_view->length + array_view->offset; i++) { int64_t offset, size; if (array_view->storage_type == NANOARROW_TYPE_LIST_VIEW) { offset = offsets.data.as_int32[i]; size = sizes.data.as_int32[i]; } else { offset = offsets.data.as_int64[i]; size = sizes.data.as_int64[i]; } if (offset < 0) { ArrowErrorSet(error, "Invalid negative offset %" PRId64 " at index %" PRId64, offset, i); return EINVAL; } if (size < 0) { ArrowErrorSet(error, "Invalid negative size %" PRId64 " at index %" PRId64, size, i); return EINVAL; } if ((offset + size) > child_len) { ArrowErrorSet(error, "Offset: %" PRId64 " + size: %" PRId64 " at index: %" PRId64 " exceeds length of child view: %" PRId64, offset, size, i, child_len); return EINVAL; } } } // Recurse for children for (int64_t i = 0; i < array_view->n_children; i++) { NANOARROW_RETURN_NOT_OK(ArrowArrayViewValidateFull(array_view->children[i], error)); } // Dictionary validation not implemented if (array_view->dictionary != NULL) { NANOARROW_RETURN_NOT_OK(ArrowArrayViewValidateFull(array_view->dictionary, error)); // TODO: validate the indices } return NANOARROW_OK; } ArrowErrorCode ArrowArrayViewValidate(struct ArrowArrayView* array_view, enum ArrowValidationLevel validation_level, struct ArrowError* error) { switch (validation_level) { case NANOARROW_VALIDATION_LEVEL_NONE: return NANOARROW_OK; case NANOARROW_VALIDATION_LEVEL_MINIMAL: return ArrowArrayViewValidateMinimal(array_view, error); case NANOARROW_VALIDATION_LEVEL_DEFAULT: return ArrowArrayViewValidateDefault(array_view, error); case NANOARROW_VALIDATION_LEVEL_FULL: NANOARROW_RETURN_NOT_OK(ArrowArrayViewValidateDefault(array_view, error)); return ArrowArrayViewValidateFull(array_view, error); } ArrowErrorSet(error, "validation_level not recognized"); return EINVAL; } struct ArrowComparisonInternalState { enum 
ArrowCompareLevel level;
  int is_equal;
  struct ArrowError* reason;
};

// Prepend a formatted path segment (e.g. ".children[3]") to the message
// already stored in out, shifting the existing message to the right.
NANOARROW_CHECK_PRINTF_ATTRIBUTE static void ArrowComparePrependPath(
    struct ArrowError* out, const char* fmt, ...) {
  if (out == NULL) {
    return;
  }

  char prefix[128];
  prefix[0] = '\0';
  va_list args;
  va_start(args, fmt);
  int prefix_len = vsnprintf(prefix, sizeof(prefix), fmt, args);
  va_end(args);

  if (prefix_len <= 0) {
    return;
  }

  size_t out_len = strlen(out->message);

  // Clamp the number of bytes shifted so the prefix + moved text fit the buffer
  size_t out_len_to_move = sizeof(struct ArrowError) - prefix_len - 1;
  if (out_len_to_move > out_len) {
    out_len_to_move = out_len;
  }

  memmove(out->message + prefix_len, out->message, out_len_to_move);
  memcpy(out->message, prefix, prefix_len);
  // NOTE(review): when the existing message was truncated above
  // (out_len_to_move < out_len), out_len + prefix_len can index one past the
  // end of out->message; it looks like this should terminate at
  // prefix_len + out_len_to_move instead — confirm against upstream.
  out->message[out_len + prefix_len] = '\0';
}

// Record inequality (using the failing condition's text as the reason) and
// return from the enclosing void helper
#define SET_NOT_EQUAL_AND_RETURN_IF_IMPL(cond_, state_, reason_) \
  do {                                                           \
    if (cond_) {                                                 \
      ArrowErrorSet(state_->reason, ": %s", reason_);            \
      state_->is_equal = 0;                                      \
      return;                                                    \
    }                                                            \
  } while (0)

#define SET_NOT_EQUAL_AND_RETURN_IF(condition_, state_) \
  SET_NOT_EQUAL_AND_RETURN_IF_IMPL(condition_, state_, #condition_)

// Byte-wise comparison of buffer i of two array views (size, then content)
static void ArrowArrayViewCompareBuffer(const struct ArrowArrayView* actual,
                                        const struct ArrowArrayView* expected, int i,
                                        struct ArrowComparisonInternalState* state) {
  SET_NOT_EQUAL_AND_RETURN_IF(
      actual->buffer_views[i].size_bytes != expected->buffer_views[i].size_bytes, state);

  int64_t buffer_size = actual->buffer_views[i].size_bytes;
  if (buffer_size > 0) {
    SET_NOT_EQUAL_AND_RETURN_IF(
        memcmp(actual->buffer_views[i].data.data, expected->buffer_views[i].data.data,
               buffer_size) != 0,
        state);
  }
}

// Recursive structural + byte-wise equality; on the first mismatch, records
// the failing condition and prepends the path component on the way out.
static void ArrowArrayViewCompareIdentical(const struct ArrowArrayView* actual,
                                           const struct ArrowArrayView* expected,
                                           struct ArrowComparisonInternalState* state) {
  SET_NOT_EQUAL_AND_RETURN_IF(actual->storage_type != expected->storage_type, state);
  SET_NOT_EQUAL_AND_RETURN_IF(actual->n_children != expected->n_children, state);
  SET_NOT_EQUAL_AND_RETURN_IF(actual->dictionary == NULL && expected->dictionary != NULL,
                              state);
  SET_NOT_EQUAL_AND_RETURN_IF(actual->dictionary != NULL && expected->dictionary == NULL,
                              state);

  SET_NOT_EQUAL_AND_RETURN_IF(actual->length != expected->length, state);
  SET_NOT_EQUAL_AND_RETURN_IF(actual->offset != expected->offset, state);
  SET_NOT_EQUAL_AND_RETURN_IF(actual->null_count != expected->null_count, state);

  for (int i = 0; i < NANOARROW_MAX_FIXED_BUFFERS; i++) {
    ArrowArrayViewCompareBuffer(actual, expected, i, state);
    if (!state->is_equal) {
      ArrowComparePrependPath(state->reason, ".buffers[%d]", i);
      return;
    }
  }

  for (int64_t i = 0; i < actual->n_children; i++) {
    ArrowArrayViewCompareIdentical(actual->children[i], expected->children[i], state);
    if (!state->is_equal) {
      ArrowComparePrependPath(state->reason, ".children[%" PRId64 "]", i);
      return;
    }
  }

  if (actual->dictionary != NULL) {
    ArrowArrayViewCompareIdentical(actual->dictionary, expected->dictionary, state);
    if (!state->is_equal) {
      ArrowComparePrependPath(state->reason, ".dictionary");
      return;
    }
  }
}

// Top-level entry point to take care of creating, cleaning up, and
// propagating the ArrowComparisonInternalState to the caller
ArrowErrorCode ArrowArrayViewCompare(const struct ArrowArrayView* actual,
                                     const struct ArrowArrayView* expected,
                                     enum ArrowCompareLevel level, int* out,
                                     struct ArrowError* reason) {
  struct ArrowComparisonInternalState state;
  state.level = level;
  state.is_equal = 1;
  state.reason = reason;

  switch (level) {
    case NANOARROW_COMPARE_IDENTICAL:
      ArrowArrayViewCompareIdentical(actual, expected, &state);
      break;
    default:
      // Unknown comparison level
      return EINVAL;
  }

  *out = state.is_equal;
  if (!state.is_equal) {
    ArrowComparePrependPath(state.reason, "root");
  }

  return NANOARROW_OK;
}

#undef SET_NOT_EQUAL_AND_RETURN_IF
#undef SET_NOT_EQUAL_AND_RETURN_IF_IMPL
// Licensed to the Apache Software Foundation (ASF) under one
// or more contributor license agreements. See the NOTICE file
// distributed with this work for additional information
// regarding copyright ownership.
The ASF licenses this file // to you under the Apache License, Version 2.0 (the // "License"); you may not use this file except in compliance // with the License. You may obtain a copy of the License at // // http://www.apache.org/licenses/LICENSE-2.0 // // Unless required by applicable law or agreed to in writing, // software distributed under the License is distributed on an // "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY // KIND, either express or implied. See the License for the // specific language governing permissions and limitations // under the License. #include #include "nanoarrow/nanoarrow.h" struct BasicArrayStreamPrivate { struct ArrowSchema schema; int64_t n_arrays; struct ArrowArray* arrays; int64_t arrays_i; }; static int ArrowBasicArrayStreamGetSchema(struct ArrowArrayStream* array_stream, struct ArrowSchema* schema) { if (array_stream == NULL || array_stream->release == NULL) { return EINVAL; } struct BasicArrayStreamPrivate* private_data = (struct BasicArrayStreamPrivate*)array_stream->private_data; return ArrowSchemaDeepCopy(&private_data->schema, schema); } static int ArrowBasicArrayStreamGetNext(struct ArrowArrayStream* array_stream, struct ArrowArray* array) { if (array_stream == NULL || array_stream->release == NULL) { return EINVAL; } struct BasicArrayStreamPrivate* private_data = (struct BasicArrayStreamPrivate*)array_stream->private_data; if (private_data->arrays_i == private_data->n_arrays) { array->release = NULL; return NANOARROW_OK; } ArrowArrayMove(&private_data->arrays[private_data->arrays_i++], array); return NANOARROW_OK; } static const char* ArrowBasicArrayStreamGetLastError( struct ArrowArrayStream* array_stream) { NANOARROW_UNUSED(array_stream); return NULL; } static void ArrowBasicArrayStreamRelease(struct ArrowArrayStream* array_stream) { if (array_stream == NULL || array_stream->release == NULL) { return; } struct BasicArrayStreamPrivate* private_data = (struct BasicArrayStreamPrivate*)array_stream->private_data; 
if (private_data->schema.release != NULL) { ArrowSchemaRelease(&private_data->schema); } for (int64_t i = 0; i < private_data->n_arrays; i++) { if (private_data->arrays[i].release != NULL) { ArrowArrayRelease(&private_data->arrays[i]); } } if (private_data->arrays != NULL) { ArrowFree(private_data->arrays); } ArrowFree(private_data); array_stream->release = NULL; } ArrowErrorCode ArrowBasicArrayStreamInit(struct ArrowArrayStream* array_stream, struct ArrowSchema* schema, int64_t n_arrays) { struct BasicArrayStreamPrivate* private_data = (struct BasicArrayStreamPrivate*)ArrowMalloc( sizeof(struct BasicArrayStreamPrivate)); if (private_data == NULL) { return ENOMEM; } ArrowSchemaMove(schema, &private_data->schema); private_data->n_arrays = n_arrays; private_data->arrays = NULL; private_data->arrays_i = 0; if (n_arrays > 0) { private_data->arrays = (struct ArrowArray*)ArrowMalloc(n_arrays * sizeof(struct ArrowArray)); if (private_data->arrays == NULL) { ArrowBasicArrayStreamRelease(array_stream); ArrowFree(private_data); return ENOMEM; } } for (int64_t i = 0; i < private_data->n_arrays; i++) { private_data->arrays[i].release = NULL; } array_stream->get_schema = &ArrowBasicArrayStreamGetSchema; array_stream->get_next = &ArrowBasicArrayStreamGetNext; array_stream->get_last_error = ArrowBasicArrayStreamGetLastError; array_stream->release = ArrowBasicArrayStreamRelease; array_stream->private_data = private_data; return NANOARROW_OK; } void ArrowBasicArrayStreamSetArray(struct ArrowArrayStream* array_stream, int64_t i, struct ArrowArray* array) { struct BasicArrayStreamPrivate* private_data = (struct BasicArrayStreamPrivate*)array_stream->private_data; ArrowArrayMove(array, &private_data->arrays[i]); } ArrowErrorCode ArrowBasicArrayStreamValidate(const struct ArrowArrayStream* array_stream, struct ArrowError* error) { struct BasicArrayStreamPrivate* private_data = (struct BasicArrayStreamPrivate*)array_stream->private_data; struct ArrowArrayView array_view; 
NANOARROW_RETURN_NOT_OK( ArrowArrayViewInitFromSchema(&array_view, &private_data->schema, error)); for (int64_t i = 0; i < private_data->n_arrays; i++) { if (private_data->arrays[i].release != NULL) { int result = ArrowArrayViewSetArray(&array_view, &private_data->arrays[i], error); if (result != NANOARROW_OK) { ArrowArrayViewReset(&array_view); return result; } } } ArrowArrayViewReset(&array_view); return NANOARROW_OK; } ================================================ FILE: data/lang/cpp/nanoarrow/nanoarrow.h ================================================ // Licensed to the Apache Software Foundation (ASF) under one // or more contributor license agreements. See the NOTICE file // distributed with this work for additional information // regarding copyright ownership. The ASF licenses this file // to you under the Apache License, Version 2.0 (the // "License"); you may not use this file except in compliance // with the License. You may obtain a copy of the License at // // http://www.apache.org/licenses/LICENSE-2.0 // // Unless required by applicable law or agreed to in writing, // software distributed under the License is distributed on an // "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY // KIND, either express or implied. See the License for the // specific language governing permissions and limitations // under the License. 
#ifndef NANOARROW_CONFIG_H_INCLUDED #define NANOARROW_CONFIG_H_INCLUDED #define NANOARROW_VERSION_MAJOR 0 #define NANOARROW_VERSION_MINOR 8 #define NANOARROW_VERSION_PATCH 0 #define NANOARROW_VERSION "0.8.0" #define NANOARROW_VERSION_INT \ (NANOARROW_VERSION_MAJOR * 10000 + NANOARROW_VERSION_MINOR * 100 + \ NANOARROW_VERSION_PATCH) // #define NANOARROW_NAMESPACE YourNamespaceHere #if !defined(NANOARROW_CXX_NAMESPACE) #define NANOARROW_CXX_NAMESPACE nanoarrow #endif #define NANOARROW_CXX_NAMESPACE_BEGIN namespace NANOARROW_CXX_NAMESPACE { #define NANOARROW_CXX_NAMESPACE_END } #endif // Licensed to the Apache Software Foundation (ASF) under one // or more contributor license agreements. See the NOTICE file // distributed with this work for additional information // regarding copyright ownership. The ASF licenses this file // to you under the Apache License, Version 2.0 (the // "License"); you may not use this file except in compliance // with the License. You may obtain a copy of the License at // // http://www.apache.org/licenses/LICENSE-2.0 // // Unless required by applicable law or agreed to in writing, // software distributed under the License is distributed on an // "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY // KIND, either express or implied. See the License for the // specific language governing permissions and limitations // under the License. 
#ifndef NANOARROW_NANOARROW_TYPES_H_INCLUDED
#define NANOARROW_NANOARROW_TYPES_H_INCLUDED

// FIX: the header names were lost from these includes during extraction
// (they read "#include #include"); restored from upstream nanoarrow:
// stdint.h for fixed-width integer types, string.h for memcpy/strlen used by
// the inline helpers later in this header.
#include <stdint.h>
#include <string.h>

#if defined(NANOARROW_DEBUG) && !defined(NANOARROW_PRINT_AND_DIE)
// fprintf()/abort() for the debug-mode NANOARROW_PRINT_AND_DIE default
#include <stdio.h>
#include <stdlib.h>
#endif

#ifdef __cplusplus
extern "C" {
#endif

// Extra guard for versions of Arrow without the canonical guard
#ifndef ARROW_FLAG_DICTIONARY_ORDERED

/// \defgroup nanoarrow-arrow-cdata Arrow C Data interface
///
/// The Arrow C Data (https://arrow.apache.org/docs/format/CDataInterface.html)
/// and Arrow C Stream (https://arrow.apache.org/docs/format/CStreamInterface.html)
/// interfaces are part of the
/// Arrow Columnar Format specification
/// (https://arrow.apache.org/docs/format/Columnar.html). See the Arrow documentation for
/// documentation of these structures.
///
/// @{

#ifndef ARROW_C_DATA_INTERFACE
#define ARROW_C_DATA_INTERFACE

#define ARROW_FLAG_DICTIONARY_ORDERED 1
#define ARROW_FLAG_NULLABLE 2
#define ARROW_FLAG_MAP_KEYS_SORTED 4

struct ArrowSchema {
  // Array type description
  const char* format;
  const char* name;
  const char* metadata;
  int64_t flags;
  int64_t n_children;
  struct ArrowSchema** children;
  struct ArrowSchema* dictionary;

  // Release callback
  void (*release)(struct ArrowSchema*);
  // Opaque producer-specific data
  void* private_data;
};

struct ArrowArray {
  // Array data description
  int64_t length;
  int64_t null_count;
  int64_t offset;
  int64_t n_buffers;
  int64_t n_children;
  const void** buffers;
  struct ArrowArray** children;
  struct ArrowArray* dictionary;

  // Release callback
  void (*release)(struct ArrowArray*);
  // Opaque producer-specific data
  void* private_data;
};

#endif  // ARROW_C_DATA_INTERFACE

#ifndef ARROW_C_STREAM_INTERFACE
#define ARROW_C_STREAM_INTERFACE

struct ArrowArrayStream {
  // Callback to get the stream type
  // (will be the same for all arrays in the stream).
  //
  // Return value: 0 if successful, an `errno`-compatible error code otherwise.
  //
  // If successful, the ArrowSchema must be released independently from the stream.
  int (*get_schema)(struct ArrowArrayStream*, struct ArrowSchema* out);

  // Callback to get the next array
  // (if no error and the array is released, the stream has ended)
  //
  // Return value: 0 if successful, an `errno`-compatible error code otherwise.
  //
  // If successful, the ArrowArray must be released independently from the stream.
  int (*get_next)(struct ArrowArrayStream*, struct ArrowArray* out);

  // Callback to get optional detailed error information.
  // This must only be called if the last stream operation failed
  // with a non-0 return code.
  //
  // Return value: pointer to a null-terminated character array describing
  // the last error, or NULL if no description is available.
  //
  // The returned pointer is only valid until the next operation on this stream
  // (including release).
  const char* (*get_last_error)(struct ArrowArrayStream*);

  // Release callback: release the stream's own resources.
  // Note that arrays returned by `get_next` must be individually released.
  void (*release)(struct ArrowArrayStream*);

  // Opaque producer-specific data
  void* private_data;
};

#endif  // ARROW_C_STREAM_INTERFACE
#endif  // ARROW_FLAG_DICTIONARY_ORDERED

/// @}

// Utility macros
#define _NANOARROW_CONCAT(x, y) x##y
#define _NANOARROW_MAKE_NAME(x, y) _NANOARROW_CONCAT(x, y)

#define _NANOARROW_RETURN_NOT_OK_IMPL(NAME, EXPR) \
  do {                                            \
    const int NAME = (EXPR);                      \
    if (NAME) return NAME;                        \
  } while (0)

#define _NANOARROW_CHECK_RANGE(x_, min_, max_) \
  NANOARROW_RETURN_NOT_OK((x_ >= min_ && x_ <= max_) ? NANOARROW_OK : EINVAL)

#define _NANOARROW_CHECK_UPPER_LIMIT(x_, max_) \
  NANOARROW_RETURN_NOT_OK((x_ <= max_) ?
NANOARROW_OK : EINVAL)

#if defined(NANOARROW_DEBUG)
// Debug build: include source file/line in the auto-generated error message
#define _NANOARROW_RETURN_NOT_OK_WITH_ERROR_IMPL(NAME, EXPR, ERROR_PTR_EXPR, EXPR_STR) \
  do {                                                                                 \
    const int NAME = (EXPR);                                                           \
    if (NAME) {                                                                        \
      ArrowErrorSet((ERROR_PTR_EXPR), "%s failed with errno %d\n* %s:%d", EXPR_STR,    \
                    NAME, __FILE__, __LINE__);                                         \
      return NAME;                                                                     \
    }                                                                                  \
  } while (0)
#else
#define _NANOARROW_RETURN_NOT_OK_WITH_ERROR_IMPL(NAME, EXPR, ERROR_PTR_EXPR, EXPR_STR) \
  do {                                                                                 \
    const int NAME = (EXPR);                                                           \
    if (NAME) {                                                                        \
      ArrowErrorSet((ERROR_PTR_EXPR), "%s failed with errno %d", EXPR_STR, NAME);      \
      return NAME;                                                                     \
    }                                                                                  \
  } while (0)
#endif

#if defined(NANOARROW_DEBUG)

// For checking ArrowErrorSet() calls for valid printf format strings/arguments
// If using mingw's c99-compliant printf, we need a different format-checking attribute
#if defined(__USE_MINGW_ANSI_STDIO) && defined(__MINGW_PRINTF_FORMAT)
#define NANOARROW_CHECK_PRINTF_ATTRIBUTE \
  __attribute__((format(__MINGW_PRINTF_FORMAT, 2, 3)))
#elif defined(__GNUC__)
#define NANOARROW_CHECK_PRINTF_ATTRIBUTE __attribute__((format(printf, 2, 3)))
#else
#define NANOARROW_CHECK_PRINTF_ATTRIBUTE
#endif

// For checking calls to functions that return ArrowErrorCode
#if defined(__GNUC__) && (__GNUC__ >= 4)
#define NANOARROW_CHECK_RETURN_ATTRIBUTE __attribute__((warn_unused_result))
#elif defined(_MSC_VER) && (_MSC_VER >= 1700)
#define NANOARROW_CHECK_RETURN_ATTRIBUTE _Check_return_
#else
#define NANOARROW_CHECK_RETURN_ATTRIBUTE
#endif

#else
// Release build: the checking attributes expand to nothing
#define NANOARROW_CHECK_RETURN_ATTRIBUTE
#define NANOARROW_CHECK_PRINTF_ATTRIBUTE
#endif

#define NANOARROW_UNUSED(x) (void)(x)

/// \brief Return code for success.
/// \ingroup nanoarrow-errors
#define NANOARROW_OK 0

/// \brief Represents an errno-compatible error code
/// \ingroup nanoarrow-errors
typedef int ArrowErrorCode;

#if defined(NANOARROW_DEBUG)
// In debug builds, tag every ArrowErrorCode-returning function so the compiler
// warns when a caller discards the result
#define ArrowErrorCode NANOARROW_CHECK_RETURN_ATTRIBUTE ArrowErrorCode
#endif

/// \brief Flags supported by ArrowSchemaViewInit()
/// \ingroup nanoarrow-schema-view
#define NANOARROW_FLAG_ALL_SUPPORTED \
  (ARROW_FLAG_DICTIONARY_ORDERED | ARROW_FLAG_NULLABLE | ARROW_FLAG_MAP_KEYS_SORTED)

/// \brief Error type containing a UTF-8 encoded message.
/// \ingroup nanoarrow-errors
struct ArrowError {
  /// \brief A character buffer with space for an error message.
  char message[1024];
};

/// \brief Ensure an ArrowError is null-terminated by zeroing the first character.
/// \ingroup nanoarrow-errors
///
/// If error is NULL, this function does nothing.
static inline void ArrowErrorInit(struct ArrowError* error) {
  if (error != NULL) {
    error->message[0] = '\0';
  }
}

/// \brief Get the contents of an error
/// \ingroup nanoarrow-errors
///
/// If error is NULL, returns "", or returns the contents of the error message
/// otherwise.
static inline const char* ArrowErrorMessage(struct ArrowError* error) {
  if (error == NULL) {
    return "";
  } else {
    return error->message;
  }
}

/// \brief Set the contents of an error from an existing null-terminated string
/// \ingroup nanoarrow-errors
///
/// If error is NULL, this function does nothing.
static inline void ArrowErrorSetString(struct ArrowError* error, const char* src) { if (error == NULL) { return; } int64_t src_len = strlen(src); if (src_len >= ((int64_t)sizeof(error->message))) { memcpy(error->message, src, sizeof(error->message) - 1); error->message[sizeof(error->message) - 1] = '\0'; } else { memcpy(error->message, src, src_len); error->message[src_len] = '\0'; } } /// \brief Check the result of an expression and return it if not NANOARROW_OK /// \ingroup nanoarrow-errors #define NANOARROW_RETURN_NOT_OK(EXPR) \ _NANOARROW_RETURN_NOT_OK_IMPL(_NANOARROW_MAKE_NAME(errno_status_, __COUNTER__), EXPR) /// \brief Check the result of an expression and return it if not NANOARROW_OK, /// adding an auto-generated message to an ArrowError. /// \ingroup nanoarrow-errors /// /// This macro is used to ensure that functions that accept an ArrowError /// as input always set its message when returning an error code (e.g., when calling /// a nanoarrow function that does *not* accept ArrowError). #define NANOARROW_RETURN_NOT_OK_WITH_ERROR(EXPR, ERROR_EXPR) \ _NANOARROW_RETURN_NOT_OK_WITH_ERROR_IMPL( \ _NANOARROW_MAKE_NAME(errno_status_, __COUNTER__), EXPR, ERROR_EXPR, #EXPR) #if defined(NANOARROW_DEBUG) && !defined(NANOARROW_PRINT_AND_DIE) #define NANOARROW_PRINT_AND_DIE(VALUE, EXPR_STR) \ do { \ fprintf(stderr, "%s failed with code %d\n* %s:%d\n", EXPR_STR, (int)(VALUE), \ __FILE__, (int)__LINE__); \ abort(); \ } while (0) #endif #if defined(NANOARROW_DEBUG) #define _NANOARROW_ASSERT_OK_IMPL(NAME, EXPR, EXPR_STR) \ do { \ const int NAME = (EXPR); \ if (NAME) NANOARROW_PRINT_AND_DIE(NAME, EXPR_STR); \ } while (0) /// \brief Assert that an expression's value is NANOARROW_OK /// \ingroup nanoarrow-errors /// /// If nanoarrow was built in debug mode (i.e., defined(NANOARROW_DEBUG) is true), /// print a message to stderr and abort. If nanoarrow was built in release mode, /// this statement has no effect. 
/// You can customize fatal error behaviour by defining the NANOARROW_PRINT_AND_DIE
/// macro before including nanoarrow.h. This macro is provided as a convenience for
/// users and is not used internally.
#define NANOARROW_ASSERT_OK(EXPR) \
  _NANOARROW_ASSERT_OK_IMPL(_NANOARROW_MAKE_NAME(errno_status_, __COUNTER__), EXPR, #EXPR)

// Abort with a message when EXPR is false (debug builds only).
#define _NANOARROW_DCHECK_IMPL(EXPR, EXPR_STR) \
  do { \
    if (!(EXPR)) NANOARROW_PRINT_AND_DIE(-1, EXPR_STR); \
  } while (0)

#define NANOARROW_DCHECK(EXPR) _NANOARROW_DCHECK_IMPL(EXPR, #EXPR)
#else
// Release builds: NANOARROW_ASSERT_OK still evaluates EXPR (for side effects);
// NANOARROW_DCHECK expands to nothing.
#define NANOARROW_ASSERT_OK(EXPR) (void)(EXPR)
#define NANOARROW_DCHECK(EXPR)
#endif

// Transfer ownership of src into dst by bitwise copy, then mark src as released
// (release == NULL) per the Arrow C data interface "moved" convention.
static inline void ArrowSchemaMove(struct ArrowSchema* src, struct ArrowSchema* dst) {
  NANOARROW_DCHECK(src != NULL);
  NANOARROW_DCHECK(dst != NULL);
  memcpy(dst, src, sizeof(struct ArrowSchema));
  src->release = NULL;
}

// Invoke the schema's release callback. The callback is expected to set
// schema->release to NULL (checked in debug builds).
static inline void ArrowSchemaRelease(struct ArrowSchema* schema) {
  NANOARROW_DCHECK(schema != NULL);
  schema->release(schema);
  NANOARROW_DCHECK(schema->release == NULL);
}

// Same move semantics as ArrowSchemaMove, for ArrowArray.
static inline void ArrowArrayMove(struct ArrowArray* src, struct ArrowArray* dst) {
  NANOARROW_DCHECK(src != NULL);
  NANOARROW_DCHECK(dst != NULL);
  memcpy(dst, src, sizeof(struct ArrowArray));
  src->release = NULL;
}

// Same release semantics as ArrowSchemaRelease, for ArrowArray.
static inline void ArrowArrayRelease(struct ArrowArray* array) {
  NANOARROW_DCHECK(array != NULL);
  array->release(array);
  NANOARROW_DCHECK(array->release == NULL);
}

// Same move semantics as ArrowSchemaMove, for ArrowArrayStream.
static inline void ArrowArrayStreamMove(struct ArrowArrayStream* src,
                                        struct ArrowArrayStream* dst) {
  NANOARROW_DCHECK(src != NULL);
  NANOARROW_DCHECK(dst != NULL);
  memcpy(dst, src, sizeof(struct ArrowArrayStream));
  src->release = NULL;
}

// Fetch the stream's last error message, mapping a NULL result to "" so callers
// never have to NULL-check the returned pointer.
static inline const char* ArrowArrayStreamGetLastError(
    struct ArrowArrayStream* array_stream) {
  NANOARROW_DCHECK(array_stream != NULL);

  const char* value = array_stream->get_last_error(array_stream);
  if (value == NULL) {
    return "";
  } else {
    return value;
  }
}

// Call the stream's get_schema callback; on failure, copy the stream's last
// error message into the (optional) ArrowError.
static inline ArrowErrorCode ArrowArrayStreamGetSchema(
    struct ArrowArrayStream* array_stream, struct ArrowSchema* out,
    struct ArrowError* error) {
  NANOARROW_DCHECK(array_stream != NULL);

  int result = array_stream->get_schema(array_stream, out);
  if (result != NANOARROW_OK && error != NULL) {
    ArrowErrorSetString(error, ArrowArrayStreamGetLastError(array_stream));
  }

  return result;
}

// Call the stream's get_next callback; on failure, copy the stream's last
// error message into the (optional) ArrowError.
static inline ArrowErrorCode ArrowArrayStreamGetNext(
    struct ArrowArrayStream* array_stream, struct ArrowArray* out,
    struct ArrowError* error) {
  NANOARROW_DCHECK(array_stream != NULL);

  int result = array_stream->get_next(array_stream, out);
  if (result != NANOARROW_OK && error != NULL) {
    ArrowErrorSetString(error, ArrowArrayStreamGetLastError(array_stream));
  }

  return result;
}

// Invoke the stream's release callback (expected to NULL the release member).
static inline void ArrowArrayStreamRelease(struct ArrowArrayStream* array_stream) {
  NANOARROW_DCHECK(array_stream != NULL);
  array_stream->release(array_stream);
  NANOARROW_DCHECK(array_stream->release == NULL);
}

// Runtime endianness probe: returns nonzero on little-endian platforms
// (inspects the first byte of a uint32_t equal to 1 via memcpy).
static char _ArrowIsLittleEndian(void) {
  uint32_t check = 1;
  char first_byte;
  memcpy(&first_byte, &check, sizeof(char));
  return first_byte;
}

/// \brief Arrow type enumerator
/// \ingroup nanoarrow-utils
///
/// These names are intended to map to the corresponding arrow::Type::type
/// enumerator; however, the numeric values are specifically not equal
/// (i.e., do not rely on numeric comparison).
enum ArrowType {
  NANOARROW_TYPE_UNINITIALIZED = 0,
  NANOARROW_TYPE_NA = 1,
  NANOARROW_TYPE_BOOL,
  NANOARROW_TYPE_UINT8,
  NANOARROW_TYPE_INT8,
  NANOARROW_TYPE_UINT16,
  NANOARROW_TYPE_INT16,
  NANOARROW_TYPE_UINT32,
  NANOARROW_TYPE_INT32,
  NANOARROW_TYPE_UINT64,
  NANOARROW_TYPE_INT64,
  NANOARROW_TYPE_HALF_FLOAT,
  NANOARROW_TYPE_FLOAT,
  NANOARROW_TYPE_DOUBLE,
  NANOARROW_TYPE_STRING,
  NANOARROW_TYPE_BINARY,
  NANOARROW_TYPE_FIXED_SIZE_BINARY,
  NANOARROW_TYPE_DATE32,
  NANOARROW_TYPE_DATE64,
  NANOARROW_TYPE_TIMESTAMP,
  NANOARROW_TYPE_TIME32,
  NANOARROW_TYPE_TIME64,
  NANOARROW_TYPE_INTERVAL_MONTHS,
  NANOARROW_TYPE_INTERVAL_DAY_TIME,
  NANOARROW_TYPE_DECIMAL128,
  NANOARROW_TYPE_DECIMAL256,
  NANOARROW_TYPE_LIST,
  NANOARROW_TYPE_STRUCT,
  NANOARROW_TYPE_SPARSE_UNION,
  NANOARROW_TYPE_DENSE_UNION,
  NANOARROW_TYPE_DICTIONARY,
  NANOARROW_TYPE_MAP,
  NANOARROW_TYPE_EXTENSION,
  NANOARROW_TYPE_FIXED_SIZE_LIST,
  NANOARROW_TYPE_DURATION,
  NANOARROW_TYPE_LARGE_STRING,
  NANOARROW_TYPE_LARGE_BINARY,
  NANOARROW_TYPE_LARGE_LIST,
  NANOARROW_TYPE_INTERVAL_MONTH_DAY_NANO,
  NANOARROW_TYPE_RUN_END_ENCODED,
  NANOARROW_TYPE_BINARY_VIEW,
  NANOARROW_TYPE_STRING_VIEW,
  NANOARROW_TYPE_DECIMAL32,
  NANOARROW_TYPE_DECIMAL64,
  NANOARROW_TYPE_LIST_VIEW,
  NANOARROW_TYPE_LARGE_LIST_VIEW,
};

/// \brief Get a string value of an enum ArrowType value
/// \ingroup nanoarrow-utils
///
/// Returns NULL for invalid values for type (including
/// NANOARROW_TYPE_UNINITIALIZED, which has no string form).
static inline const char* ArrowTypeString(enum ArrowType type);

static inline const char* ArrowTypeString(enum ArrowType type) {
  // Single exit point: the result is collected into one local and returned.
  const char* type_name = NULL;
  switch (type) {
    case NANOARROW_TYPE_NA: type_name = "na"; break;
    case NANOARROW_TYPE_BOOL: type_name = "bool"; break;
    case NANOARROW_TYPE_UINT8: type_name = "uint8"; break;
    case NANOARROW_TYPE_INT8: type_name = "int8"; break;
    case NANOARROW_TYPE_UINT16: type_name = "uint16"; break;
    case NANOARROW_TYPE_INT16: type_name = "int16"; break;
    case NANOARROW_TYPE_UINT32: type_name = "uint32"; break;
    case NANOARROW_TYPE_INT32: type_name = "int32"; break;
    case NANOARROW_TYPE_UINT64: type_name = "uint64"; break;
    case NANOARROW_TYPE_INT64: type_name = "int64"; break;
    case NANOARROW_TYPE_HALF_FLOAT: type_name = "half_float"; break;
    case NANOARROW_TYPE_FLOAT: type_name = "float"; break;
    case NANOARROW_TYPE_DOUBLE: type_name = "double"; break;
    case NANOARROW_TYPE_STRING: type_name = "string"; break;
    case NANOARROW_TYPE_BINARY: type_name = "binary"; break;
    case NANOARROW_TYPE_FIXED_SIZE_BINARY: type_name = "fixed_size_binary"; break;
    case NANOARROW_TYPE_DATE32: type_name = "date32"; break;
    case NANOARROW_TYPE_DATE64: type_name = "date64"; break;
    case NANOARROW_TYPE_TIMESTAMP: type_name = "timestamp"; break;
    case NANOARROW_TYPE_TIME32: type_name = "time32"; break;
    case NANOARROW_TYPE_TIME64: type_name = "time64"; break;
    case NANOARROW_TYPE_INTERVAL_MONTHS: type_name = "interval_months"; break;
    case NANOARROW_TYPE_INTERVAL_DAY_TIME: type_name = "interval_day_time"; break;
    case NANOARROW_TYPE_DECIMAL32: type_name = "decimal32"; break;
    case NANOARROW_TYPE_DECIMAL64: type_name = "decimal64"; break;
    case NANOARROW_TYPE_DECIMAL128: type_name = "decimal128"; break;
    case NANOARROW_TYPE_DECIMAL256: type_name = "decimal256"; break;
    case NANOARROW_TYPE_LIST: type_name = "list"; break;
    case NANOARROW_TYPE_STRUCT: type_name = "struct"; break;
    case NANOARROW_TYPE_SPARSE_UNION: type_name = "sparse_union"; break;
    case NANOARROW_TYPE_DENSE_UNION: type_name = "dense_union"; break;
    case NANOARROW_TYPE_DICTIONARY: type_name = "dictionary"; break;
    case NANOARROW_TYPE_MAP: type_name = "map"; break;
    case NANOARROW_TYPE_EXTENSION: type_name = "extension"; break;
    case NANOARROW_TYPE_FIXED_SIZE_LIST: type_name = "fixed_size_list"; break;
    case NANOARROW_TYPE_DURATION: type_name = "duration"; break;
    case NANOARROW_TYPE_LARGE_STRING: type_name = "large_string"; break;
    case NANOARROW_TYPE_LARGE_BINARY: type_name = "large_binary"; break;
    case NANOARROW_TYPE_LARGE_LIST: type_name = "large_list"; break;
    case NANOARROW_TYPE_INTERVAL_MONTH_DAY_NANO:
      type_name = "interval_month_day_nano";
      break;
    case NANOARROW_TYPE_RUN_END_ENCODED: type_name = "run_end_encoded"; break;
    case NANOARROW_TYPE_BINARY_VIEW: type_name = "binary_view"; break;
    case NANOARROW_TYPE_STRING_VIEW: type_name = "string_view"; break;
    case NANOARROW_TYPE_LIST_VIEW: type_name = "list_view"; break;
    case NANOARROW_TYPE_LARGE_LIST_VIEW: type_name = "large_list_view"; break;
    default: type_name = NULL; break;
  }
  return type_name;
}

/// \brief Arrow time unit enumerator
/// \ingroup nanoarrow-utils
///
/// These names and values map to the corresponding arrow::TimeUnit::type
/// enumerator.
enum ArrowTimeUnit {
  NANOARROW_TIME_UNIT_SECOND = 0,
  NANOARROW_TIME_UNIT_MILLI = 1,
  NANOARROW_TIME_UNIT_MICRO = 2,
  NANOARROW_TIME_UNIT_NANO = 3
};

/// \brief Validation level enumerator
/// \ingroup nanoarrow-array
enum ArrowValidationLevel {
  /// \brief Do not validate buffer sizes or content.
  NANOARROW_VALIDATION_LEVEL_NONE = 0,

  /// \brief Validate buffer sizes that depend on array length but do not validate buffer
  /// sizes that depend on buffer data access.
  NANOARROW_VALIDATION_LEVEL_MINIMAL = 1,

  /// \brief Validate all buffer sizes, including those that require buffer data access,
  /// but do not perform any checks that are O(1) along the length of the buffers.
  NANOARROW_VALIDATION_LEVEL_DEFAULT = 2,

  /// \brief Validate all buffer sizes and all buffer content. This is useful in the
  /// context of untrusted input or input that may have been corrupted in transit.
  NANOARROW_VALIDATION_LEVEL_FULL = 3
};

/// \brief Comparison level enumerator
/// \ingroup nanoarrow-utils
enum ArrowCompareLevel {
  /// \brief Consider arrays equal if buffers contain identical content
  /// and have identical offset, null count, and length. Note that this is
  /// a much stricter check than logical equality, which would take into
  /// account potentially different content of null slots, arrays with a
  /// non-zero offset, and other considerations.
  NANOARROW_COMPARE_IDENTICAL,
};

/// \brief Get a string value of an enum ArrowTimeUnit value
/// \ingroup nanoarrow-utils
///
/// Returns NULL for invalid values for time_unit
static inline const char* ArrowTimeUnitString(enum ArrowTimeUnit time_unit);

static inline const char* ArrowTimeUnitString(enum ArrowTimeUnit time_unit) {
  switch (time_unit) {
    case NANOARROW_TIME_UNIT_SECOND:
      return "s";
    case NANOARROW_TIME_UNIT_MILLI:
      return "ms";
    case NANOARROW_TIME_UNIT_MICRO:
      return "us";
    case NANOARROW_TIME_UNIT_NANO:
      return "ns";
    default:
      return NULL;
  }
}

/// \brief Functional types of buffers as described in the Arrow Columnar Specification
/// \ingroup nanoarrow-array-view
enum ArrowBufferType {
  NANOARROW_BUFFER_TYPE_NONE,
  NANOARROW_BUFFER_TYPE_VALIDITY,
  NANOARROW_BUFFER_TYPE_TYPE_ID,
  NANOARROW_BUFFER_TYPE_UNION_OFFSET,
  NANOARROW_BUFFER_TYPE_DATA_OFFSET,
  NANOARROW_BUFFER_TYPE_DATA,
  NANOARROW_BUFFER_TYPE_VARIADIC_DATA,
  NANOARROW_BUFFER_TYPE_VARIADIC_SIZE,
  NANOARROW_BUFFER_TYPE_VIEW_OFFSET,
  NANOARROW_BUFFER_TYPE_SIZE,
};

/// \brief The maximum number of fixed buffers in an ArrowArrayView or ArrowLayout
/// \ingroup nanoarrow-array-view
#define NANOARROW_MAX_FIXED_BUFFERS 3

/// \brief A non-owning view of a string
/// \ingroup nanoarrow-utils
struct ArrowStringView {
  /// \brief A pointer to the start of the string
  ///
  /// If size_bytes is 0, this value may be NULL.
  const char* data;

  /// \brief The size of the string in bytes,
  ///
  /// (Not including the null terminator.)
  int64_t size_bytes;
};

/// \brief Return a view of a const C string
/// \ingroup nanoarrow-utils
///
/// A NULL value yields a view with data == NULL and size_bytes == 0.
static inline struct ArrowStringView ArrowCharView(const char* value);

static inline struct ArrowStringView ArrowCharView(const char* value) {
  struct ArrowStringView view;
  view.data = value;
  view.size_bytes = (value != NULL) ? (int64_t)strlen(value) : 0;
  return view;
}

// Typed aliases over the same raw buffer pointer.
union ArrowBufferViewData {
  const void* data;
  const int8_t* as_int8;
  const uint8_t* as_uint8;
  const int16_t* as_int16;
  const uint16_t* as_uint16;
  const int32_t* as_int32;
  const uint32_t* as_uint32;
  const int64_t* as_int64;
  const uint64_t* as_uint64;
  const double* as_double;
  const float* as_float;
  const char* as_char;
  const union ArrowBinaryView* as_binary_view;
};

/// \brief A non-owning view of a buffer
/// \ingroup nanoarrow-utils
struct ArrowBufferView {
  /// \brief A pointer to the start of the buffer
  ///
  /// If size_bytes is 0, this value may be NULL.
  union ArrowBufferViewData data;

  /// \brief The size of the buffer in bytes
  int64_t size_bytes;
};

/// \brief Array buffer allocation and deallocation
/// \ingroup nanoarrow-buffer
///
/// Container for allocate, reallocate, and free methods that can be used
/// to customize allocation and deallocation of buffers when constructing
/// an ArrowArray.
struct ArrowBufferAllocator {
  /// \brief Reallocate a buffer or return NULL if it cannot be reallocated
  uint8_t* (*reallocate)(struct ArrowBufferAllocator* allocator, uint8_t* ptr,
                         int64_t old_size, int64_t new_size);

  /// \brief Deallocate a buffer allocated by this allocator
  void (*free)(struct ArrowBufferAllocator* allocator, uint8_t* ptr, int64_t size);

  /// \brief Opaque data specific to the allocator
  void* private_data;
};

// Signature of a custom free callback compatible with ArrowBufferAllocator::free.
typedef void (*ArrowBufferDeallocatorCallback)(struct ArrowBufferAllocator* allocator,
                                               uint8_t* ptr, int64_t size);

/// \brief An owning mutable view of a buffer
/// \ingroup nanoarrow-buffer
struct ArrowBuffer {
  /// \brief A pointer to the start of the buffer
  ///
  /// If capacity_bytes is 0, this value may be NULL.
  uint8_t* data;

  /// \brief The size of the buffer in bytes
  int64_t size_bytes;

  /// \brief The capacity of the buffer in bytes
  int64_t capacity_bytes;

  /// \brief The allocator that will be used to reallocate and/or free the buffer
  struct ArrowBufferAllocator allocator;
};

/// \brief An owning mutable view of a bitmap
/// \ingroup nanoarrow-bitmap
struct ArrowBitmap {
  /// \brief An ArrowBuffer to hold the allocated memory
  struct ArrowBuffer buffer;

  /// \brief The number of bits that have been appended to the bitmap
  int64_t size_bits;
};

/// \brief A description of an arrangement of buffers
/// \ingroup nanoarrow-utils
///
/// Contains the minimum amount of information required to
/// calculate the size of each buffer in an ArrowArray knowing only
/// the length and offset of the array.
struct ArrowLayout {
  /// \brief The function of each buffer
  enum ArrowBufferType buffer_type[NANOARROW_MAX_FIXED_BUFFERS];

  /// \brief The data type of each buffer
  enum ArrowType buffer_data_type[NANOARROW_MAX_FIXED_BUFFERS];

  /// \brief The size of an element each buffer or 0 if this size is variable or unknown
  int64_t element_size_bits[NANOARROW_MAX_FIXED_BUFFERS];

  /// \brief The number of elements in the child array per element in this array for a
  /// fixed-size list
  int64_t child_size_elements;
};

/// \brief A non-owning view of an ArrowArray
/// \ingroup nanoarrow-array-view
///
/// This data structure provides access to the values contained within
/// an ArrowArray with fields provided in a more readily-extractible
/// form. You can re-use an ArrowArrayView for multiple ArrowArrays
/// with the same storage type, use it to represent a hypothetical
/// ArrowArray that does not exist yet, or use it to validate the buffers
/// of a future ArrowArray.
struct ArrowArrayView {
  /// \brief The underlying ArrowArray or NULL if it has not been set or
  /// if the buffers in this ArrowArrayView are not backed by an ArrowArray.
  const struct ArrowArray* array;

  /// \brief The number of elements from the physical start of the buffers.
  int64_t offset;

  /// \brief The number of elements in this view.
  int64_t length;

  /// \brief A cached null count or -1 to indicate that this value is unknown.
  int64_t null_count;

  /// \brief The type used to store values in this array
  ///
  /// This type represents only the minimum required information to
  /// extract values from the array buffers (e.g., for a Date32 array,
  /// this value will be NANOARROW_TYPE_INT32). For dictionary-encoded
  /// arrays, this will be the index type.
  enum ArrowType storage_type;

  /// \brief The buffer types, strides, and sizes of this Array's buffers
  struct ArrowLayout layout;

  /// \brief This Array's buffers as ArrowBufferView objects
  struct ArrowBufferView buffer_views[NANOARROW_MAX_FIXED_BUFFERS];

  /// \brief The number of children of this view
  int64_t n_children;

  /// \brief Pointers to views of this array's children
  struct ArrowArrayView** children;

  /// \brief Pointer to a view of this array's dictionary
  struct ArrowArrayView* dictionary;

  /// \brief Union type id to child index mapping
  ///
  /// If storage_type is a union type, a 256-byte ArrowMalloc()ed buffer
  /// such that child_index == union_type_id_map[type_id] and
  /// type_id == union_type_id_map[128 + child_index]. This value may be
  /// NULL in the case where child_id == type_id.
  int8_t* union_type_id_map;

  /// \brief Number of variadic buffers
  int32_t n_variadic_buffers;

  /// \brief Pointers to variadic buffers of binary/string_view arrays
  const void** variadic_buffers;

  /// \brief Size of each variadic buffer
  int64_t* variadic_buffer_sizes;
};

// Used as the private data member for ArrowArrays allocated here and accessed
// internally within inline ArrowArray* helpers.
struct ArrowArrayPrivateData {
  // Holder for the validity buffer (or first buffer for union types, which are
  // the only type whose first buffer is not a valdiity buffer)
  struct ArrowBitmap bitmap;

  // Holder for additional buffers as required
  struct ArrowBuffer buffers[NANOARROW_MAX_FIXED_BUFFERS - 1];

  // The array of pointers to buffers. This must be updated after a sequence
  // of appends to synchronize its values with the actual buffer addresses
  // (which may have been reallocated during that time)
  const void** buffer_data;

  // The storage data type, or NANOARROW_TYPE_UNINITIALIZED if unknown
  enum ArrowType storage_type;

  // The buffer arrangement for the storage type
  struct ArrowLayout layout;

  // Flag to indicate if there are non-sequence union type ids.
  // In the future this could be replaced with a type id<->child mapping
  // to support constructing unions in append mode where type_id != child_index
  int8_t union_type_id_is_child_index;

  // Number of variadic buffers for binary view types
  int32_t n_variadic_buffers;

  // Variadic buffers for binary view types
  struct ArrowBuffer* variadic_buffers;

  // The current offset used to build list views
  int64_t list_view_offset;
};

/// \brief A representation of an interval.
/// \ingroup nanoarrow-utils
struct ArrowInterval {
  /// \brief The type of interval being used
  enum ArrowType type;
  /// \brief The number of months represented by the interval
  int32_t months;
  /// \brief The number of days represented by the interval
  int32_t days;
  /// \brief The number of ms represented by the interval
  int32_t ms;
  /// \brief The number of ns represented by the interval
  int64_t ns;
};

/// \brief Zero initialize an Interval with a given unit
/// \ingroup nanoarrow-utils
static inline void ArrowIntervalInit(struct ArrowInterval* interval,
                                     enum ArrowType type) {
  memset(interval, 0, sizeof(struct ArrowInterval));
  interval->type = type;
}

/// \brief A representation of a fixed-precision decimal number
/// \ingroup nanoarrow-utils
///
/// This structure should be initialized with ArrowDecimalInit() once and
/// values set using ArrowDecimalSetInt(), ArrowDecimalSetBytes128(),
/// or ArrowDecimalSetBytes256().
struct ArrowDecimal {
  /// \brief An array of 64-bit integers of n_words length defined in native-endian order.
  /// For a 32-bit decimal value, index 0 will be a 32-bit integer value.
  uint64_t words[4];

  /// \brief The number of significant digits this decimal number can represent
  int32_t precision;

  /// \brief The number of digits after the decimal point. This can be negative.
  int32_t scale;

  /// \brief The number of 64-bit words in the words array. For the special case of a
  /// 32-bit decimal value, this will be 0.
  int n_words;

  /// \brief Cached value used by the implementation
  int high_word_index;

  /// \brief Cached value used by the implementation
  int low_word_index;
};

/// \brief Initialize a decimal with a given set of type parameters
/// \ingroup nanoarrow-utils
static inline void ArrowDecimalInit(struct ArrowDecimal* decimal, int32_t bitwidth,
                                    int32_t precision, int32_t scale) {
  memset(decimal->words, 0, sizeof(decimal->words));
  decimal->precision = precision;
  decimal->scale = scale;
  // n_words will be 0 for bitwidth == 32
  decimal->n_words = (int)(bitwidth / 8 / sizeof(uint64_t));

  // Cache which word holds the least/most significant bits for this platform's
  // endianness so that sign/int accessors need not branch on endianness again.
  if (_ArrowIsLittleEndian()) {
    decimal->low_word_index = 0;
    decimal->high_word_index = decimal->n_words > 0 ? decimal->n_words - 1 : 0;
  } else {
    decimal->low_word_index = decimal->n_words > 0 ? decimal->n_words - 1 : 0;
    decimal->high_word_index = 0;
  }
}

/// \brief Get a signed integer value of a sufficiently small ArrowDecimal
///
/// This does not check if the decimal's precision sufficiently small to fit
/// within the signed 64-bit integer range (A precision less than or equal
/// to 18 is sufficiently small).
static inline int64_t ArrowDecimalGetIntUnsafe(const struct ArrowDecimal* decimal) {
  // n_words == 0 marks the 32-bit decimal special case stored in words[0].
  if (decimal->n_words == 0) {
    int32_t value;
    memcpy(&value, decimal->words, sizeof(int32_t));
    return value;
  }

  return (int64_t)decimal->words[decimal->low_word_index];
}

/// \brief Copy the bytes of this decimal into a sufficiently large buffer
/// \ingroup nanoarrow-utils
static inline void ArrowDecimalGetBytes(const struct ArrowDecimal* decimal,
                                        uint8_t* out) {
  if (decimal->n_words == 0) {
    memcpy(out, decimal->words, sizeof(int32_t));
  } else {
    memcpy(out, decimal->words, decimal->n_words * sizeof(uint64_t));
  }
}

/// \brief Returns 1 if the value represented by decimal is >= 0 or -1 otherwise
/// \ingroup nanoarrow-utils
static inline int64_t ArrowDecimalSign(const struct ArrowDecimal* decimal) {
  if (decimal->n_words == 0) {
    return ArrowDecimalGetIntUnsafe(decimal) >= 0 ? 1 : -1;
  } else {
    // Arithmetic right shift of the sign bit yields 0 or -1; OR with 1 maps
    // those to +1 and -1 respectively.
    return 1 | ((int64_t)(decimal->words[decimal->high_word_index]) >> 63);
  }
}

/// \brief Sets the integer value of this decimal
/// \ingroup nanoarrow-utils
static inline void ArrowDecimalSetInt(struct ArrowDecimal* decimal, int64_t value) {
  if (decimal->n_words == 0) {
    int32_t value32 = (int32_t)value;
    memcpy(decimal->words, &value32, sizeof(int32_t));
    return;
  }

  // Sign-extend across all words before storing the low word.
  if (value < 0) {
    memset(decimal->words, 0xff, decimal->n_words * sizeof(uint64_t));
  } else {
    memset(decimal->words, 0, decimal->n_words * sizeof(uint64_t));
  }

  decimal->words[decimal->low_word_index] = value;
}

/// \brief Negate the value of this decimal in place
/// \ingroup nanoarrow-utils
static inline void ArrowDecimalNegate(struct ArrowDecimal* decimal) {
  if (decimal->n_words == 0) {
    int32_t value;
    memcpy(&value, decimal->words, sizeof(int32_t));
    value = -value;
    memcpy(decimal->words, &value, sizeof(int32_t));
    return;
  }

  // Two's complement negation (~x + 1), propagating the carry from the
  // least-significant word toward the most-significant word.
  uint64_t carry = 1;

  if (decimal->low_word_index == 0) {
    for (int i = 0; i < decimal->n_words; i++) {
      uint64_t elem = decimal->words[i];
      elem = ~elem + carry;
      carry &= (elem == 0);
      decimal->words[i] = elem;
    }
  } else {
    for (int i = decimal->low_word_index; i >= 0; i--) {
      uint64_t elem = decimal->words[i];
      elem = ~elem + carry;
      carry &= (elem == 0);
      decimal->words[i] = elem;
    }
  }
}

/// \brief Copy bytes from a buffer into this decimal
/// \ingroup nanoarrow-utils
static inline void ArrowDecimalSetBytes(struct ArrowDecimal* decimal,
                                        const uint8_t* value) {
  if (decimal->n_words == 0) {
    memcpy(decimal->words, value, sizeof(int32_t));
  } else {
    memcpy(decimal->words, value, decimal->n_words * sizeof(uint64_t));
  }
}

#ifdef __cplusplus
}
#endif

#endif  // end of the preceding (inline types) header section

// Licensed to the Apache Software Foundation (ASF) under one
// or more contributor license agreements. See the NOTICE file
// distributed with this work for additional information
// regarding copyright ownership.
The ASF licenses this file // to you under the Apache License, Version 2.0 (the // "License"); you may not use this file except in compliance // with the License. You may obtain a copy of the License at // // http://www.apache.org/licenses/LICENSE-2.0 // // Unless required by applicable law or agreed to in writing, // software distributed under the License is distributed on an // "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY // KIND, either express or implied. See the License for the // specific language governing permissions and limitations // under the License. #ifndef NANOARROW_H_INCLUDED #define NANOARROW_H_INCLUDED #include #include #include // If using CMake, optionally pass -DNANOARROW_NAMESPACE=MyNamespace which will set this // define in nanoarrow_config.h. If not, you can optionally #define NANOARROW_NAMESPACE // MyNamespace here. // This section remaps the non-prefixed symbols to the prefixed symbols so that // code written against this build can be used independent of the value of // NANOARROW_NAMESPACE. 
#ifdef NANOARROW_NAMESPACE

// Token-pasting helpers used to prefix every public symbol with
// NANOARROW_NAMESPACE so that multiple vendored copies can coexist.
#define NANOARROW_CAT(A, B) A##B
#define NANOARROW_SYMBOL(A, B) NANOARROW_CAT(A, B)

#define ArrowNanoarrowVersion NANOARROW_SYMBOL(NANOARROW_NAMESPACE, ArrowNanoarrowVersion)
#define ArrowNanoarrowVersionInt \
  NANOARROW_SYMBOL(NANOARROW_NAMESPACE, ArrowNanoarrowVersionInt)
#define ArrowMalloc NANOARROW_SYMBOL(NANOARROW_NAMESPACE, ArrowMalloc)
#define ArrowRealloc NANOARROW_SYMBOL(NANOARROW_NAMESPACE, ArrowRealloc)
#define ArrowFree NANOARROW_SYMBOL(NANOARROW_NAMESPACE, ArrowFree)
#define ArrowBufferAllocatorDefault \
  NANOARROW_SYMBOL(NANOARROW_NAMESPACE, ArrowBufferAllocatorDefault)
#define ArrowBufferDeallocator \
  NANOARROW_SYMBOL(NANOARROW_NAMESPACE, ArrowBufferDeallocator)
#define ArrowErrorSet NANOARROW_SYMBOL(NANOARROW_NAMESPACE, ArrowErrorSet)
#define ArrowLayoutInit NANOARROW_SYMBOL(NANOARROW_NAMESPACE, ArrowLayoutInit)
#define ArrowDecimalSetDigits NANOARROW_SYMBOL(NANOARROW_NAMESPACE, ArrowDecimalSetDigits)
#define ArrowDecimalAppendDigitsToBuffer \
  NANOARROW_SYMBOL(NANOARROW_NAMESPACE, ArrowDecimalAppendDigitsToBuffer)
#define ArrowDecimalAppendStringToBuffer \
  NANOARROW_SYMBOL(NANOARROW_NAMESPACE, ArrowDecimalAppendStringToBuffer)
#define ArrowSchemaInit NANOARROW_SYMBOL(NANOARROW_NAMESPACE, ArrowSchemaInit)
#define ArrowSchemaInitFromType \
  NANOARROW_SYMBOL(NANOARROW_NAMESPACE, ArrowSchemaInitFromType)
#define ArrowSchemaSetType NANOARROW_SYMBOL(NANOARROW_NAMESPACE, ArrowSchemaSetType)
#define ArrowSchemaSetTypeStruct \
  NANOARROW_SYMBOL(NANOARROW_NAMESPACE, ArrowSchemaSetTypeStruct)
#define ArrowSchemaSetTypeFixedSize \
  NANOARROW_SYMBOL(NANOARROW_NAMESPACE, ArrowSchemaSetTypeFixedSize)
#define ArrowSchemaSetTypeDecimal \
  NANOARROW_SYMBOL(NANOARROW_NAMESPACE, ArrowSchemaSetTypeDecimal)
#define ArrowSchemaSetTypeRunEndEncoded \
  NANOARROW_SYMBOL(NANOARROW_NAMESPACE, ArrowSchemaSetTypeRunEndEncoded)
#define ArrowSchemaSetTypeDateTime \
  NANOARROW_SYMBOL(NANOARROW_NAMESPACE, ArrowSchemaSetTypeDateTime)
#define ArrowSchemaSetTypeUnion \
  NANOARROW_SYMBOL(NANOARROW_NAMESPACE, ArrowSchemaSetTypeUnion)
#define ArrowSchemaDeepCopy NANOARROW_SYMBOL(NANOARROW_NAMESPACE, ArrowSchemaDeepCopy)
#define ArrowSchemaSetFormat NANOARROW_SYMBOL(NANOARROW_NAMESPACE, ArrowSchemaSetFormat)
#define ArrowSchemaSetName NANOARROW_SYMBOL(NANOARROW_NAMESPACE, ArrowSchemaSetName)
#define ArrowSchemaSetMetadata \
  NANOARROW_SYMBOL(NANOARROW_NAMESPACE, ArrowSchemaSetMetadata)
#define ArrowSchemaAllocateChildren \
  NANOARROW_SYMBOL(NANOARROW_NAMESPACE, ArrowSchemaAllocateChildren)
#define ArrowSchemaAllocateDictionary \
  NANOARROW_SYMBOL(NANOARROW_NAMESPACE, ArrowSchemaAllocateDictionary)
#define ArrowMetadataReaderInit \
  NANOARROW_SYMBOL(NANOARROW_NAMESPACE, ArrowMetadataReaderInit)
#define ArrowMetadataReaderRead \
  NANOARROW_SYMBOL(NANOARROW_NAMESPACE, ArrowMetadataReaderRead)
#define ArrowMetadataSizeOf NANOARROW_SYMBOL(NANOARROW_NAMESPACE, ArrowMetadataSizeOf)
#define ArrowMetadataHasKey NANOARROW_SYMBOL(NANOARROW_NAMESPACE, ArrowMetadataHasKey)
#define ArrowMetadataGetValue NANOARROW_SYMBOL(NANOARROW_NAMESPACE, ArrowMetadataGetValue)
#define ArrowMetadataBuilderInit \
  NANOARROW_SYMBOL(NANOARROW_NAMESPACE, ArrowMetadataBuilderInit)
#define ArrowMetadataBuilderAppend \
  NANOARROW_SYMBOL(NANOARROW_NAMESPACE, ArrowMetadataBuilderAppend)
#define ArrowMetadataBuilderSet \
  NANOARROW_SYMBOL(NANOARROW_NAMESPACE, ArrowMetadataBuilderSet)
#define ArrowMetadataBuilderRemove \
  NANOARROW_SYMBOL(NANOARROW_NAMESPACE, ArrowMetadataBuilderRemove)
#define ArrowSchemaViewInit NANOARROW_SYMBOL(NANOARROW_NAMESPACE, ArrowSchemaViewInit)
#define ArrowSchemaToString NANOARROW_SYMBOL(NANOARROW_NAMESPACE, ArrowSchemaToString)
#define ArrowArrayInitFromType \
  NANOARROW_SYMBOL(NANOARROW_NAMESPACE, ArrowArrayInitFromType)
#define ArrowArrayInitFromSchema \
  NANOARROW_SYMBOL(NANOARROW_NAMESPACE, ArrowArrayInitFromSchema)
#define ArrowArrayInitFromArrayView \
  NANOARROW_SYMBOL(NANOARROW_NAMESPACE, ArrowArrayInitFromArrayView)
// NOTE(review): the define below is an exact duplicate of the one above. An
// identical macro redefinition is legal C (benign redefinition) so this is
// harmless, but it could be removed when next syncing with upstream.
#define ArrowArrayInitFromArrayView \
  NANOARROW_SYMBOL(NANOARROW_NAMESPACE, ArrowArrayInitFromArrayView)
#define ArrowArrayAllocateChildren \
  NANOARROW_SYMBOL(NANOARROW_NAMESPACE, ArrowArrayAllocateChildren)
#define ArrowArrayAllocateDictionary \
  NANOARROW_SYMBOL(NANOARROW_NAMESPACE, ArrowArrayAllocateDictionary)
#define ArrowArraySetValidityBitmap \
  NANOARROW_SYMBOL(NANOARROW_NAMESPACE, ArrowArraySetValidityBitmap)
#define ArrowArraySetBuffer NANOARROW_SYMBOL(NANOARROW_NAMESPACE, ArrowArraySetBuffer)
#define ArrowArrayReserve NANOARROW_SYMBOL(NANOARROW_NAMESPACE, ArrowArrayReserve)
#define ArrowArrayFinishBuilding \
  NANOARROW_SYMBOL(NANOARROW_NAMESPACE, ArrowArrayFinishBuilding)
#define ArrowArrayFinishBuildingDefault \
  NANOARROW_SYMBOL(NANOARROW_NAMESPACE, ArrowArrayFinishBuildingDefault)
#define ArrowArrayViewInitFromType \
  NANOARROW_SYMBOL(NANOARROW_NAMESPACE, ArrowArrayViewInitFromType)
#define ArrowArrayViewInitFromSchema \
  NANOARROW_SYMBOL(NANOARROW_NAMESPACE, ArrowArrayViewInitFromSchema)
#define ArrowArrayViewAllocateChildren \
  NANOARROW_SYMBOL(NANOARROW_NAMESPACE, ArrowArrayViewAllocateChildren)
#define ArrowArrayViewAllocateDictionary \
  NANOARROW_SYMBOL(NANOARROW_NAMESPACE, ArrowArrayViewAllocateDictionary)
#define ArrowArrayViewSetLength \
  NANOARROW_SYMBOL(NANOARROW_NAMESPACE, ArrowArrayViewSetLength)
#define ArrowArrayViewSetArray \
  NANOARROW_SYMBOL(NANOARROW_NAMESPACE, ArrowArrayViewSetArray)
#define ArrowArrayViewSetArrayMinimal \
  NANOARROW_SYMBOL(NANOARROW_NAMESPACE, ArrowArrayViewSetArrayMinimal)
#define ArrowArrayViewValidate \
  NANOARROW_SYMBOL(NANOARROW_NAMESPACE, ArrowArrayViewValidate)
#define ArrowArrayViewCompare NANOARROW_SYMBOL(NANOARROW_NAMESPACE, ArrowArrayViewCompare)
#define ArrowArrayViewReset NANOARROW_SYMBOL(NANOARROW_NAMESPACE, ArrowArrayViewReset)
#define ArrowBasicArrayStreamInit \
  NANOARROW_SYMBOL(NANOARROW_NAMESPACE, ArrowBasicArrayStreamInit)
#define ArrowBasicArrayStreamSetArray \
  NANOARROW_SYMBOL(NANOARROW_NAMESPACE, ArrowBasicArrayStreamSetArray)
#define ArrowBasicArrayStreamValidate \
  NANOARROW_SYMBOL(NANOARROW_NAMESPACE, ArrowBasicArrayStreamValidate)

#endif

// Select the symbol visibility/linkage attribute: dllexport/dllimport when
// building or consuming a Windows DLL, default visibility on GCC >= 4,
// and nothing otherwise.
#if (defined _WIN32 || defined __CYGWIN__) && defined(NANOARROW_BUILD_DLL)
#if defined(NANOARROW_EXPORT_DLL)
#define NANOARROW_DLL __declspec(dllexport)
#else
#define NANOARROW_DLL __declspec(dllimport)
#endif  // defined(NANOARROW_EXPORT_DLL)
#elif !defined(NANOARROW_DLL)
#if defined(__GNUC__) && __GNUC__ >= 4
#define NANOARROW_DLL __attribute__((visibility("default")))
#else
#define NANOARROW_DLL
#endif  // __GNUC__ >= 4
#endif

#ifdef __cplusplus
extern "C" {
#endif

/// \defgroup nanoarrow Nanoarrow C library
///
/// Except where noted, objects are not thread-safe and clients should
/// take care to serialize accesses to methods.
///
/// Because this library is intended to be vendored, it provides full type
/// definitions and encourages clients to stack or statically allocate
/// where convenient.

/// \defgroup nanoarrow-malloc Memory management
///
/// Non-buffer members of a struct ArrowSchema and struct ArrowArray
/// must be allocated using ArrowMalloc() or ArrowRealloc() and freed
/// using ArrowFree() for schemas and arrays allocated here. Buffer members
/// are allocated using an ArrowBufferAllocator.
///
/// @{

/// \brief Allocate like malloc()
NANOARROW_DLL void* ArrowMalloc(int64_t size);

/// \brief Reallocate like realloc()
NANOARROW_DLL void* ArrowRealloc(void* ptr, int64_t size);

/// \brief Free a pointer allocated using ArrowMalloc() or ArrowRealloc().
NANOARROW_DLL void ArrowFree(void* ptr);

/// \brief Return the default allocator
///
/// The default allocator uses ArrowMalloc(), ArrowRealloc(), and
/// ArrowFree().
NANOARROW_DLL struct ArrowBufferAllocator ArrowBufferAllocatorDefault(void);

/// \brief Create a custom deallocator
///
/// Creates a buffer allocator with only a free method that can be used to
/// attach a custom deallocator to an ArrowBuffer.
This may be used to /// avoid copying an existing buffer that was not allocated using the /// infrastructure provided here (e.g., by an R or Python object). NANOARROW_DLL struct ArrowBufferAllocator ArrowBufferDeallocator( ArrowBufferDeallocatorCallback, void* private_data); /// @} /// \brief Move the contents of an src ArrowSchema into dst and set src->release to NULL /// \ingroup nanoarrow-arrow-cdata static inline void ArrowSchemaMove(struct ArrowSchema* src, struct ArrowSchema* dst); /// \brief Call the release callback of an ArrowSchema /// \ingroup nanoarrow-arrow-cdata static inline void ArrowSchemaRelease(struct ArrowSchema* schema); /// \brief Move the contents of an src ArrowArray into dst and set src->release to NULL /// \ingroup nanoarrow-arrow-cdata static inline void ArrowArrayMove(struct ArrowArray* src, struct ArrowArray* dst); /// \brief Call the release callback of an ArrowArray static inline void ArrowArrayRelease(struct ArrowArray* array); /// \brief Move the contents of an src ArrowArrayStream into dst and set src->release to /// NULL \ingroup nanoarrow-arrow-cdata static inline void ArrowArrayStreamMove(struct ArrowArrayStream* src, struct ArrowArrayStream* dst); /// \brief Call the get_schema callback of an ArrowArrayStream /// \ingroup nanoarrow-arrow-cdata /// /// Unlike the get_schema callback, this wrapper checks the return code /// and propagates the error reported by get_last_error into error. This /// makes it significantly less verbose to iterate over array streams /// using NANOARROW_RETURN_NOT_OK()-style error handling. static inline ArrowErrorCode ArrowArrayStreamGetSchema( struct ArrowArrayStream* array_stream, struct ArrowSchema* out, struct ArrowError* error); /// \brief Call the get_next callback of an ArrowArrayStream /// \ingroup nanoarrow-arrow-cdata /// /// Unlike the get_next callback, this wrapper checks the return code /// and propagates the error reported by get_last_error into error. 
This /// makes it significantly less verbose to iterate over array streams /// using NANOARROW_RETURN_NOT_OK()-style error handling. static inline ArrowErrorCode ArrowArrayStreamGetNext( struct ArrowArrayStream* array_stream, struct ArrowArray* out, struct ArrowError* error); /// \brief Call the get_last_error callback of an ArrowArrayStream /// \ingroup nanoarrow-arrow-cdata /// /// Unlike the get_last_error callback, this function never returns NULL (i.e., /// its result is safe to use in printf-style error formatters). Null values /// from the original callback are reported as /// "". static inline const char* ArrowArrayStreamGetLastError( struct ArrowArrayStream* array_stream); /// \brief Call the release callback of an ArrowArrayStream static inline void ArrowArrayStreamRelease(struct ArrowArrayStream* array_stream); /// \defgroup nanoarrow-errors Error handling /// /// Functions generally return an errno-compatible error code; functions that /// need to communicate more verbose error information accept a pointer /// to an ArrowError. This can be stack or statically allocated. The /// content of the message is undefined unless an error code has been /// returned. If a nanoarrow function is passed a non-null ArrowError pointer, the /// ArrowError pointed to by the argument will be propagated with a /// null-terminated error message. It is safe to pass a NULL ArrowError anywhere /// in the nanoarrow API. /// /// Except where documented, it is generally not safe to continue after a /// function has returned a non-zero ArrowErrorCode. The NANOARROW_RETURN_NOT_OK and /// NANOARROW_ASSERT_OK macros are provided to help propagate errors. C++ clients can use /// the helpers provided in the nanoarrow.hpp header to facilitate using C++ idioms /// for memory management and error propagation. /// /// @{ /// \brief Set the contents of an error using printf syntax. /// /// If error is NULL, this function does nothing and returns NANOARROW_OK. 
NANOARROW_DLL NANOARROW_CHECK_PRINTF_ATTRIBUTE int ArrowErrorSet(struct ArrowError* error, const char* fmt, ...); /// @} /// \defgroup nanoarrow-utils Utility data structures /// /// @{ /// \brief Return a version string in the form "major.minor.patch" NANOARROW_DLL const char* ArrowNanoarrowVersion(void); /// \brief Return an integer that can be used to compare versions sequentially NANOARROW_DLL int ArrowNanoarrowVersionInt(void); /// \brief Initialize a description of buffer arrangements from a storage type NANOARROW_DLL void ArrowLayoutInit(struct ArrowLayout* layout, enum ArrowType storage_type); /// \brief Create a string view from a null-terminated string static inline struct ArrowStringView ArrowCharView(const char* value); /// \brief Sets the integer value of an ArrowDecimal from a string NANOARROW_DLL ArrowErrorCode ArrowDecimalSetDigits(struct ArrowDecimal* decimal, struct ArrowStringView value); /// \brief Get the integer value of an ArrowDecimal as string NANOARROW_DLL ArrowErrorCode ArrowDecimalAppendDigitsToBuffer( const struct ArrowDecimal* decimal, struct ArrowBuffer* buffer); /// \brief Get the decimal value of an ArrowDecimal as a string NANOARROW_DLL ArrowErrorCode ArrowDecimalAppendStringToBuffer( const struct ArrowDecimal* decimal, struct ArrowBuffer* buffer); /// \brief Get the half float value of a float static inline uint16_t ArrowFloatToHalfFloat(float value); /// \brief Get the float value of a half float static inline float ArrowHalfFloatToFloat(uint16_t value); /// \brief Resolve a chunk index from increasing int64_t offsets /// /// Given a buffer of increasing int64_t offsets that begin with 0 (e.g., offset buffer /// of a large type, run ends of a chunked array implementation), resolve a value v /// where lo <= v < hi such that offsets[v] <= index < offsets[v + 1]. 
static inline int64_t ArrowResolveChunk64(int64_t index, const int64_t* offsets, int64_t lo, int64_t hi); /// @} /// \defgroup nanoarrow-schema Creating schemas /// /// These functions allocate, copy, and destroy ArrowSchema structures /// /// @{ /// \brief Initialize an ArrowSchema /// /// Initializes the fields and release callback of schema_out. Caller /// is responsible for calling the schema->release callback if /// NANOARROW_OK is returned. NANOARROW_DLL void ArrowSchemaInit(struct ArrowSchema* schema); /// \brief Initialize an ArrowSchema from an ArrowType /// /// A convenience constructor for that calls ArrowSchemaInit() and /// ArrowSchemaSetType() for the common case of constructing an /// unparameterized type. The caller is responsible for calling the schema->release /// callback if NANOARROW_OK is returned. NANOARROW_DLL ArrowErrorCode ArrowSchemaInitFromType(struct ArrowSchema* schema, enum ArrowType type); /// \brief Get a human-readable summary of a Schema /// /// Writes a summary of an ArrowSchema to out (up to n - 1 characters) /// and returns the number of characters required for the output if /// n were sufficiently large. If recursive is non-zero, the result will /// also include children. NANOARROW_DLL int64_t ArrowSchemaToString(const struct ArrowSchema* schema, char* out, int64_t n, char recursive); /// \brief Set the format field of a schema from an ArrowType /// /// Initializes the fields and release callback of schema_out. For /// NANOARROW_TYPE_LIST, NANOARROW_TYPE_LARGE_LIST, and /// NANOARROW_TYPE_MAP, the appropriate number of children are /// allocated, initialized, and named; however, the caller must /// ArrowSchemaSetType() on the preinitialized children. Schema must have been initialized /// using ArrowSchemaInit() or ArrowSchemaDeepCopy(). 
NANOARROW_DLL ArrowErrorCode ArrowSchemaSetType(struct ArrowSchema* schema, enum ArrowType type); /// \brief Set the format field and initialize children of a struct schema /// /// The specified number of children are initialized; however, the caller is responsible /// for calling ArrowSchemaSetType() and ArrowSchemaSetName() on each child. /// Schema must have been initialized using ArrowSchemaInit() or ArrowSchemaDeepCopy(). NANOARROW_DLL ArrowErrorCode ArrowSchemaSetTypeStruct(struct ArrowSchema* schema, int64_t n_children); /// \brief Set the format field of a fixed-size schema /// /// Returns EINVAL for fixed_size <= 0 or for type that is not /// NANOARROW_TYPE_FIXED_SIZE_BINARY or NANOARROW_TYPE_FIXED_SIZE_LIST. /// For NANOARROW_TYPE_FIXED_SIZE_LIST, the appropriate number of children are /// allocated, initialized, and named; however, the caller must /// ArrowSchemaSetType() the first child. Schema must have been initialized using /// ArrowSchemaInit() or ArrowSchemaDeepCopy(). NANOARROW_DLL ArrowErrorCode ArrowSchemaSetTypeFixedSize(struct ArrowSchema* schema, enum ArrowType type, int32_t fixed_size); /// \brief Set the format field of a decimal schema /// /// Returns EINVAL for scale <= 0 or for type that is not /// NANOARROW_TYPE_DECIMAL32, NANOARROW_TYPE_DECIMAL64, NANOARROW_TYPE_DECIMAL128 or /// NANOARROW_TYPE_DECIMAL256. Schema must have been initialized using /// ArrowSchemaInit() or ArrowSchemaDeepCopy(). NANOARROW_DLL ArrowErrorCode ArrowSchemaSetTypeDecimal(struct ArrowSchema* schema, enum ArrowType type, int32_t decimal_precision, int32_t decimal_scale); /// \brief Set the format field of a run-end encoded schema /// /// Returns EINVAL for run_end_type that is not /// NANOARROW_TYPE_INT16, NANOARROW_TYPE_INT32 or NANOARROW_TYPE_INT64. /// Schema must have been initialized using ArrowSchemaInit() or ArrowSchemaDeepCopy(). /// The caller must call `ArrowSchemaSetTypeXXX(schema->children[1])` to /// set the value type. 
Note that when building arrays using the `ArrowArrayAppendXXX()` /// functions, the run-end encoded array's logical length must be updated manually. NANOARROW_DLL ArrowErrorCode ArrowSchemaSetTypeRunEndEncoded(struct ArrowSchema* schema, enum ArrowType run_end_type); /// \brief Set the format field of a time, timestamp, or duration schema /// /// Returns EINVAL for type that is not /// NANOARROW_TYPE_TIME32, NANOARROW_TYPE_TIME64, /// NANOARROW_TYPE_TIMESTAMP, or NANOARROW_TYPE_DURATION. The /// timezone parameter must be NULL for a non-timestamp type. Schema must have been /// initialized using ArrowSchemaInit() or ArrowSchemaDeepCopy(). NANOARROW_DLL ArrowErrorCode ArrowSchemaSetTypeDateTime(struct ArrowSchema* schema, enum ArrowType type, enum ArrowTimeUnit time_unit, const char* timezone); /// \brief Set the format field of a union schema /// /// Returns EINVAL for a type that is not NANOARROW_TYPE_DENSE_UNION /// or NANOARROW_TYPE_SPARSE_UNION. The specified number of children are /// allocated, and initialized. NANOARROW_DLL ArrowErrorCode ArrowSchemaSetTypeUnion(struct ArrowSchema* schema, enum ArrowType type, int64_t n_children); /// \brief Make a (recursive) copy of a schema /// /// Allocates and copies fields of schema into schema_out. NANOARROW_DLL ArrowErrorCode ArrowSchemaDeepCopy(const struct ArrowSchema* schema, struct ArrowSchema* schema_out); /// \brief Copy format into schema->format /// /// schema must have been allocated using ArrowSchemaInitFromType() or /// ArrowSchemaDeepCopy(). NANOARROW_DLL ArrowErrorCode ArrowSchemaSetFormat(struct ArrowSchema* schema, const char* format); /// \brief Copy name into schema->name /// /// schema must have been allocated using ArrowSchemaInitFromType() or /// ArrowSchemaDeepCopy(). 
NANOARROW_DLL ArrowErrorCode ArrowSchemaSetName(struct ArrowSchema* schema, const char* name); /// \brief Copy metadata into schema->metadata /// /// schema must have been allocated using ArrowSchemaInitFromType() or /// ArrowSchemaDeepCopy. NANOARROW_DLL ArrowErrorCode ArrowSchemaSetMetadata(struct ArrowSchema* schema, const char* metadata); /// \brief Allocate the schema->children array /// /// Includes the memory for each child struct ArrowSchema. /// schema must have been allocated using ArrowSchemaInitFromType() or /// ArrowSchemaDeepCopy(). NANOARROW_DLL ArrowErrorCode ArrowSchemaAllocateChildren(struct ArrowSchema* schema, int64_t n_children); /// \brief Allocate the schema->dictionary member /// /// schema must have been allocated using ArrowSchemaInitFromType() or /// ArrowSchemaDeepCopy(). NANOARROW_DLL ArrowErrorCode ArrowSchemaAllocateDictionary(struct ArrowSchema* schema); /// @} /// \defgroup nanoarrow-metadata Create, read, and modify schema metadata /// /// @{ /// \brief Reader for key/value pairs in schema metadata /// /// The ArrowMetadataReader does not own any data and is only valid /// for the lifetime of the underlying metadata pointer. struct ArrowMetadataReader { /// \brief A metadata string from a schema->metadata field. 
const char* metadata; /// \brief The current offset into the metadata string int64_t offset; /// \brief The number of remaining keys int32_t remaining_keys; }; /// \brief Initialize an ArrowMetadataReader NANOARROW_DLL ArrowErrorCode ArrowMetadataReaderInit(struct ArrowMetadataReader* reader, const char* metadata); /// \brief Read the next key/value pair from an ArrowMetadataReader NANOARROW_DLL ArrowErrorCode ArrowMetadataReaderRead(struct ArrowMetadataReader* reader, struct ArrowStringView* key_out, struct ArrowStringView* value_out); /// \brief The number of bytes in a key/value metadata string NANOARROW_DLL int64_t ArrowMetadataSizeOf(const char* metadata); /// \brief Check for a key in schema metadata NANOARROW_DLL char ArrowMetadataHasKey(const char* metadata, struct ArrowStringView key); /// \brief Extract a value from schema metadata /// /// If key does not exist in metadata, value_out is unmodified NANOARROW_DLL ArrowErrorCode ArrowMetadataGetValue(const char* metadata, struct ArrowStringView key, struct ArrowStringView* value_out); /// \brief Initialize a builder for schema metadata from key/value pairs /// /// metadata can be an existing metadata string or NULL to initialize /// an empty metadata string. NANOARROW_DLL ArrowErrorCode ArrowMetadataBuilderInit(struct ArrowBuffer* buffer, const char* metadata); /// \brief Append a key/value pair to a buffer containing serialized metadata NANOARROW_DLL ArrowErrorCode ArrowMetadataBuilderAppend(struct ArrowBuffer* buffer, struct ArrowStringView key, struct ArrowStringView value); /// \brief Set a key/value pair to a buffer containing serialized metadata /// /// Ensures that the only entry for key in the metadata is set to value. /// This function maintains the existing position of (the first instance of) /// key if present in the data. 
NANOARROW_DLL ArrowErrorCode ArrowMetadataBuilderSet(struct ArrowBuffer* buffer, struct ArrowStringView key, struct ArrowStringView value); /// \brief Remove a key from a buffer containing serialized metadata NANOARROW_DLL ArrowErrorCode ArrowMetadataBuilderRemove(struct ArrowBuffer* buffer, struct ArrowStringView key); /// @} /// \defgroup nanoarrow-schema-view Reading schemas /// /// @{ /// \brief A non-owning view of a parsed ArrowSchema /// /// Contains more readily extractable values than a raw ArrowSchema. /// Clients can stack or statically allocate this structure but are /// encouraged to use the provided getters to ensure forward /// compatibility. struct ArrowSchemaView { /// \brief A pointer to the schema represented by this view const struct ArrowSchema* schema; /// \brief The data type represented by the schema /// /// This value may be NANOARROW_TYPE_DICTIONARY if the schema has a /// non-null dictionary member; datetime types are valid values. /// This value will never be NANOARROW_TYPE_EXTENSION (see /// extension_name and/or extension_metadata to check for /// an extension type). enum ArrowType type; /// \brief The storage data type represented by the schema /// /// This value will never be NANOARROW_TYPE_DICTIONARY, NANOARROW_TYPE_EXTENSION /// or any datetime type. This value represents only the type required to /// interpret the buffers in the array. enum ArrowType storage_type; /// \brief The storage layout represented by the schema struct ArrowLayout layout; /// \brief The extension type name if it exists /// /// If the ARROW:extension:name key is present in schema.metadata, /// extension_name.data will be non-NULL. struct ArrowStringView extension_name; /// \brief The extension type metadata if it exists /// /// If the ARROW:extension:metadata key is present in schema.metadata, /// extension_metadata.data will be non-NULL. 
struct ArrowStringView extension_metadata; /// \brief Format fixed size parameter /// /// This value is set when parsing a fixed-size binary or fixed-size /// list schema; this value is undefined for other types. For a /// fixed-size binary schema this value is in bytes; for a fixed-size /// list schema this value refers to the number of child elements for /// each element of the parent. int32_t fixed_size; /// \brief Decimal bitwidth /// /// This value is set when parsing a decimal type schema; /// this value is undefined for other types. int32_t decimal_bitwidth; /// \brief Decimal precision /// /// This value is set when parsing a decimal type schema; /// this value is undefined for other types. int32_t decimal_precision; /// \brief Decimal scale /// /// This value is set when parsing a decimal type schema; /// this value is undefined for other types. int32_t decimal_scale; /// \brief Format time unit parameter /// /// This value is set when parsing a date/time type. The value is /// undefined for other types. enum ArrowTimeUnit time_unit; /// \brief Format timezone parameter /// /// This value is set when parsing a timestamp type and represents /// the timezone format parameter. This value points to /// data within the schema and is undefined for other types. const char* timezone; /// \brief Union type ids parameter /// /// This value is set when parsing a union type and represents /// type ids parameter. This value points to /// data within the schema and is undefined for other types. const char* union_type_ids; }; /// \brief Initialize an ArrowSchemaView NANOARROW_DLL ArrowErrorCode ArrowSchemaViewInit(struct ArrowSchemaView* schema_view, const struct ArrowSchema* schema, struct ArrowError* error); /// @} /// \defgroup nanoarrow-buffer Owning, growable buffers /// /// @{ /// \brief Initialize an ArrowBuffer /// /// Initialize a buffer with a NULL, zero-size buffer using the default /// buffer allocator. 
static inline void ArrowBufferInit(struct ArrowBuffer* buffer); /// \brief Set a newly-initialized buffer's allocator /// /// Returns EINVAL if the buffer has already been allocated. static inline ArrowErrorCode ArrowBufferSetAllocator( struct ArrowBuffer* buffer, struct ArrowBufferAllocator allocator); /// \brief Reset an ArrowBuffer /// /// Releases the buffer using the allocator's free method if /// the buffer's data member is non-null, sets the data member /// to NULL, and sets the buffer's size and capacity to 0. static inline void ArrowBufferReset(struct ArrowBuffer* buffer); /// \brief Move an ArrowBuffer /// /// Transfers the buffer data and lifecycle management to another /// address and resets buffer. static inline void ArrowBufferMove(struct ArrowBuffer* src, struct ArrowBuffer* dst); /// \brief Grow or shrink a buffer to a given size /// /// When shrinking the size of the buffer, the buffer is only reallocated /// if shrink_to_fit is non-zero. static inline ArrowErrorCode ArrowBufferResize(struct ArrowBuffer* buffer, int64_t new_size_bytes, char shrink_to_fit); /// \brief Ensure a buffer has at least a given additional capacity /// /// Ensures that the buffer has space to append at least /// additional_size_bytes, overallocating when required. static inline ArrowErrorCode ArrowBufferReserve(struct ArrowBuffer* buffer, int64_t additional_size_bytes); /// \brief Write data to buffer and increment the buffer size /// /// This function does not check that buffer has the required capacity static inline void ArrowBufferAppendUnsafe(struct ArrowBuffer* buffer, const void* data, int64_t size_bytes); /// \brief Write data to buffer and increment the buffer size /// /// This function writes and ensures that the buffer has the required capacity, /// possibly by reallocating the buffer. Like ArrowBufferReserve, this will /// overallocate when reallocation is required. 
static inline ArrowErrorCode ArrowBufferAppend(struct ArrowBuffer* buffer, const void* data, int64_t size_bytes); /// \brief Write fill to buffer and increment the buffer size /// /// This function writes the specified number of fill bytes and /// ensures that the buffer has the required capacity, static inline ArrowErrorCode ArrowBufferAppendFill(struct ArrowBuffer* buffer, uint8_t value, int64_t size_bytes); /// \brief Write an 8-bit integer to a buffer static inline ArrowErrorCode ArrowBufferAppendInt8(struct ArrowBuffer* buffer, int8_t value); /// \brief Write an unsigned 8-bit integer to a buffer static inline ArrowErrorCode ArrowBufferAppendUInt8(struct ArrowBuffer* buffer, uint8_t value); /// \brief Write a 16-bit integer to a buffer static inline ArrowErrorCode ArrowBufferAppendInt16(struct ArrowBuffer* buffer, int16_t value); /// \brief Write an unsigned 16-bit integer to a buffer static inline ArrowErrorCode ArrowBufferAppendUInt16(struct ArrowBuffer* buffer, uint16_t value); /// \brief Write a 32-bit integer to a buffer static inline ArrowErrorCode ArrowBufferAppendInt32(struct ArrowBuffer* buffer, int32_t value); /// \brief Write an unsigned 32-bit integer to a buffer static inline ArrowErrorCode ArrowBufferAppendUInt32(struct ArrowBuffer* buffer, uint32_t value); /// \brief Write a 64-bit integer to a buffer static inline ArrowErrorCode ArrowBufferAppendInt64(struct ArrowBuffer* buffer, int64_t value); /// \brief Write an unsigned 64-bit integer to a buffer static inline ArrowErrorCode ArrowBufferAppendUInt64(struct ArrowBuffer* buffer, uint64_t value); /// \brief Write a double to a buffer static inline ArrowErrorCode ArrowBufferAppendDouble(struct ArrowBuffer* buffer, double value); /// \brief Write a float to a buffer static inline ArrowErrorCode ArrowBufferAppendFloat(struct ArrowBuffer* buffer, float value); /// \brief Write an ArrowStringView to a buffer static inline ArrowErrorCode ArrowBufferAppendStringView(struct ArrowBuffer* buffer, struct 
ArrowStringView value); /// \brief Write an ArrowBufferView to a buffer static inline ArrowErrorCode ArrowBufferAppendBufferView(struct ArrowBuffer* buffer, struct ArrowBufferView value); /// @} /// \defgroup nanoarrow-bitmap Bitmap utilities /// /// @{ /// \brief Extract a boolean value from a bitmap static inline int8_t ArrowBitGet(const uint8_t* bits, int64_t i); /// \brief Set a boolean value to a bitmap to true static inline void ArrowBitSet(uint8_t* bits, int64_t i); /// \brief Set a boolean value to a bitmap to false static inline void ArrowBitClear(uint8_t* bits, int64_t i); /// \brief Set a boolean value to a bitmap static inline void ArrowBitSetTo(uint8_t* bits, int64_t i, uint8_t value); /// \brief Set a boolean value to a range in a bitmap static inline void ArrowBitsSetTo(uint8_t* bits, int64_t start_offset, int64_t length, uint8_t bits_are_set); /// \brief Count true values in a bitmap static inline int64_t ArrowBitCountSet(const uint8_t* bits, int64_t i_from, int64_t i_to); /// \brief Extract int8 boolean values from a range in a bitmap static inline void ArrowBitsUnpackInt8(const uint8_t* bits, int64_t start_offset, int64_t length, int8_t* out); /// \brief Extract int32 boolean values from a range in a bitmap static inline void ArrowBitsUnpackInt32(const uint8_t* bits, int64_t start_offset, int64_t length, int32_t* out); /// \brief Initialize an ArrowBitmap /// /// Initialize the builder's buffer, empty its cache, and reset the size to zero static inline void ArrowBitmapInit(struct ArrowBitmap* bitmap); /// \brief Move an ArrowBitmap /// /// Transfers the underlying buffer data and lifecycle management to another /// address and resets the bitmap. static inline void ArrowBitmapMove(struct ArrowBitmap* src, struct ArrowBitmap* dst); /// \brief Ensure a bitmap builder has at least a given additional capacity /// /// Ensures that the buffer has space to append at least /// additional_size_bits, overallocating when required. 
static inline ArrowErrorCode ArrowBitmapReserve(struct ArrowBitmap* bitmap, int64_t additional_size_bits); /// \brief Grow or shrink a bitmap to a given size /// /// When shrinking the size of the bitmap, the bitmap is only reallocated /// if shrink_to_fit is non-zero. static inline ArrowErrorCode ArrowBitmapResize(struct ArrowBitmap* bitmap, int64_t new_size_bits, char shrink_to_fit); /// \brief Reserve space for and append zero or more of the same boolean value to a bitmap static inline ArrowErrorCode ArrowBitmapAppend(struct ArrowBitmap* bitmap, uint8_t bits_are_set, int64_t length); /// \brief Append zero or more of the same boolean value to a bitmap static inline void ArrowBitmapAppendUnsafe(struct ArrowBitmap* bitmap, uint8_t bits_are_set, int64_t length); /// \brief Append boolean values encoded as int8_t to a bitmap /// /// The values must all be 0 or 1. static inline void ArrowBitmapAppendInt8Unsafe(struct ArrowBitmap* bitmap, const int8_t* values, int64_t n_values); /// \brief Append boolean values encoded as int32_t to a bitmap /// /// The values must all be 0 or 1. static inline void ArrowBitmapAppendInt32Unsafe(struct ArrowBitmap* bitmap, const int32_t* values, int64_t n_values); /// \brief Reset a bitmap builder /// /// Releases any memory held by buffer, empties the cache, and resets the size to zero static inline void ArrowBitmapReset(struct ArrowBitmap* bitmap); /// @} /// \defgroup nanoarrow-array Creating arrays /// /// These functions allocate, copy, and destroy ArrowArray structures. /// Once an ArrowArray has been initialized via ArrowArrayInitFromType() /// or ArrowArrayInitFromSchema(), the caller is responsible for releasing /// it using the embedded release callback. /// /// @{ /// \brief Initialize the fields of an array /// /// Initializes the fields and release callback of array. Caller /// is responsible for calling the array->release callback if /// NANOARROW_OK is returned. 
NANOARROW_DLL ArrowErrorCode ArrowArrayInitFromType(struct ArrowArray* array, enum ArrowType storage_type); /// \brief Initialize the contents of an ArrowArray from an ArrowSchema /// /// Caller is responsible for calling the array->release callback if /// NANOARROW_OK is returned. NANOARROW_DLL ArrowErrorCode ArrowArrayInitFromSchema(struct ArrowArray* array, const struct ArrowSchema* schema, struct ArrowError* error); /// \brief Initialize the contents of an ArrowArray from an ArrowArrayView /// /// Caller is responsible for calling the array->release callback if /// NANOARROW_OK is returned. NANOARROW_DLL ArrowErrorCode ArrowArrayInitFromArrayView( struct ArrowArray* array, const struct ArrowArrayView* array_view, struct ArrowError* error); /// \brief Allocate the array->children array /// /// Includes the memory for each child struct ArrowArray, /// whose members are marked as released and may be subsequently initialized /// with ArrowArrayInitFromType() or moved from an existing ArrowArray. /// schema must have been allocated using ArrowArrayInitFromType(). NANOARROW_DLL ArrowErrorCode ArrowArrayAllocateChildren(struct ArrowArray* array, int64_t n_children); /// \brief Allocate the array->dictionary member /// /// Includes the memory for the struct ArrowArray, whose contents /// is marked as released and may be subsequently initialized /// with ArrowArrayInitFromType() or moved from an existing ArrowArray. 
/// array must have been allocated using ArrowArrayInitFromType() NANOARROW_DLL ArrowErrorCode ArrowArrayAllocateDictionary(struct ArrowArray* array); /// \brief Set the validity bitmap of an ArrowArray /// /// array must have been allocated using ArrowArrayInitFromType() NANOARROW_DLL void ArrowArraySetValidityBitmap(struct ArrowArray* array, struct ArrowBitmap* bitmap); /// \brief Set a buffer of an ArrowArray /// /// array must have been allocated using ArrowArrayInitFromType() NANOARROW_DLL ArrowErrorCode ArrowArraySetBuffer(struct ArrowArray* array, int64_t i, struct ArrowBuffer* buffer); /// \brief Add variadic buffers to a string or binary view array /// /// array must have been allocated using ArrowArrayInitFromType() static inline ArrowErrorCode ArrowArrayAddVariadicBuffers(struct ArrowArray* array, int32_t n_buffers); /// \brief Get the validity bitmap of an ArrowArray /// /// array must have been allocated using ArrowArrayInitFromType() static inline struct ArrowBitmap* ArrowArrayValidityBitmap(struct ArrowArray* array); /// \brief Get a buffer of an ArrowArray /// /// array must have been allocated using ArrowArrayInitFromType() static inline struct ArrowBuffer* ArrowArrayBuffer(struct ArrowArray* array, int64_t i); /// \brief Start element-wise appending to an ArrowArray /// /// Initializes any values needed to use ArrowArrayAppend*() functions. /// All element-wise appenders append by value and return EINVAL if the exact value /// cannot be represented by the underlying storage type. /// array must have been allocated using ArrowArrayInitFromType() static inline ArrowErrorCode ArrowArrayStartAppending(struct ArrowArray* array); /// \brief Reserve space for future appends /// /// For buffer sizes that can be calculated (i.e., not string data buffers or /// child array sizes for non-fixed-size arrays), recursively reserve space for /// additional elements. 
This is useful for reducing the number of reallocations /// that occur using the item-wise appenders. NANOARROW_DLL ArrowErrorCode ArrowArrayReserve(struct ArrowArray* array, int64_t additional_size_elements); /// \brief Append a null value to an array static inline ArrowErrorCode ArrowArrayAppendNull(struct ArrowArray* array, int64_t n); /// \brief Append an empty, non-null value to an array static inline ArrowErrorCode ArrowArrayAppendEmpty(struct ArrowArray* array, int64_t n); /// \brief Append a signed integer value to an array /// /// Returns NANOARROW_OK if value can be exactly represented by /// the underlying storage type or EINVAL otherwise (e.g., value /// is outside the valid array range). static inline ArrowErrorCode ArrowArrayAppendInt(struct ArrowArray* array, int64_t value); /// \brief Append an unsigned integer value to an array /// /// Returns NANOARROW_OK if value can be exactly represented by /// the underlying storage type or EINVAL otherwise (e.g., value /// is outside the valid array range). static inline ArrowErrorCode ArrowArrayAppendUInt(struct ArrowArray* array, uint64_t value); /// \brief Append a double value to an array /// /// Returns NANOARROW_OK if value can be exactly represented by /// the underlying storage type or EINVAL otherwise (e.g., value /// is outside the valid array range or there is an attempt to append /// a non-integer to an array with an integer storage type). 
static inline ArrowErrorCode ArrowArrayAppendDouble(struct ArrowArray* array, double value); /// \brief Append a string of bytes to an array /// /// Returns NANOARROW_OK if value can be exactly represented by /// the underlying storage type, EOVERFLOW if appending value would overflow /// the offset type (e.g., if the data buffer would be larger than 2 GB for a /// non-large string type), or EINVAL otherwise (e.g., the underlying array is not a /// binary, string, large binary, large string, or fixed-size binary array, or value is /// the wrong size for a fixed-size binary array). static inline ArrowErrorCode ArrowArrayAppendBytes(struct ArrowArray* array, struct ArrowBufferView value); /// \brief Append a string value to an array /// /// Returns NANOARROW_OK if value can be exactly represented by /// the underlying storage type, EOVERFLOW if appending value would overflow /// the offset type (e.g., if the data buffer would be larger than 2 GB for a /// non-large string type), or EINVAL otherwise (e.g., the underlying array is not a /// string or large string array). static inline ArrowErrorCode ArrowArrayAppendString(struct ArrowArray* array, struct ArrowStringView value); /// \brief Append a Interval to an array /// /// Returns NANOARROW_OK if value can be exactly represented by /// the underlying storage type or EINVAL otherwise. static inline ArrowErrorCode ArrowArrayAppendInterval(struct ArrowArray* array, const struct ArrowInterval* value); /// \brief Append a decimal value to an array /// /// Returns NANOARROW_OK if array is a decimal array with the appropriate /// bitwidth or EINVAL otherwise. static inline ArrowErrorCode ArrowArrayAppendDecimal(struct ArrowArray* array, const struct ArrowDecimal* value); /// \brief Finish a nested array element /// /// Appends a non-null element to the array based on the first child's current /// length. 
Returns NANOARROW_OK if the item was successfully added, EOVERFLOW /// if the child of a list or map array would exceed INT_MAX elements, or EINVAL /// if the underlying storage type is not a struct, list, large list, or fixed-size /// list, or if there was an attempt to add a struct or fixed-size list element where the /// length of the child array(s) did not match the expected length. static inline ArrowErrorCode ArrowArrayFinishElement(struct ArrowArray* array); /// \brief Finish a union array element /// /// Appends an element to the union type ids buffer and increments array->length. /// For sparse unions, up to one element is added to non type-id children. Returns /// EINVAL if the underlying storage type is not a union, if type_id is not valid, /// or if child sizes after appending are inconsistent. static inline ArrowErrorCode ArrowArrayFinishUnionElement(struct ArrowArray* array, int8_t type_id); /// \brief Shrink buffer capacity to the size required /// /// Also applies shrinking to any child arrays. array must have been allocated using /// ArrowArrayInitFromType static inline ArrowErrorCode ArrowArrayShrinkToFit(struct ArrowArray* array); /// \brief Finish building an ArrowArray /// /// Flushes any pointers from internal buffers that may have been reallocated /// into array->buffers and checks the actual size of the buffers /// against the expected size based on the final length. /// array must have been allocated using ArrowArrayInitFromType() NANOARROW_DLL ArrowErrorCode ArrowArrayFinishBuildingDefault(struct ArrowArray* array, struct ArrowError* error); /// \brief Finish building an ArrowArray with explicit validation /// /// Finish building with an explicit validation level. This could perform less validation /// (i.e. 
NANOARROW_VALIDATION_LEVEL_NONE or NANOARROW_VALIDATION_LEVEL_MINIMAL) if CPU /// buffer data access is not possible or more validation (i.e., /// NANOARROW_VALIDATION_LEVEL_FULL) if buffer content was obtained from an untrusted or /// corruptible source. NANOARROW_DLL ArrowErrorCode ArrowArrayFinishBuilding( struct ArrowArray* array, enum ArrowValidationLevel validation_level, struct ArrowError* error); /// @} /// \defgroup nanoarrow-array-view Reading arrays /// /// These functions read and validate the contents ArrowArray structures. /// /// @{ /// \brief Initialize the contents of an ArrowArrayView NANOARROW_DLL void ArrowArrayViewInitFromType(struct ArrowArrayView* array_view, enum ArrowType storage_type); /// \brief Move an ArrowArrayView /// /// Transfers the ArrowArrayView data and lifecycle management to another /// address and resets the contents of src. static inline void ArrowArrayViewMove(struct ArrowArrayView* src, struct ArrowArrayView* dst); /// \brief Initialize the contents of an ArrowArrayView from an ArrowSchema NANOARROW_DLL ArrowErrorCode ArrowArrayViewInitFromSchema(struct ArrowArrayView* array_view, const struct ArrowSchema* schema, struct ArrowError* error); /// \brief Allocate the array_view->children array /// /// Includes the memory for each child struct ArrowArrayView NANOARROW_DLL ArrowErrorCode ArrowArrayViewAllocateChildren(struct ArrowArrayView* array_view, int64_t n_children); /// \brief Allocate array_view->dictionary NANOARROW_DLL ArrowErrorCode ArrowArrayViewAllocateDictionary(struct ArrowArrayView* array_view); /// \brief Set data-independent buffer sizes from length NANOARROW_DLL void ArrowArrayViewSetLength(struct ArrowArrayView* array_view, int64_t length); /// \brief Set buffer sizes and data pointers from an ArrowArray NANOARROW_DLL ArrowErrorCode ArrowArrayViewSetArray(struct ArrowArrayView* array_view, const struct ArrowArray* array, struct ArrowError* error); /// \brief Set buffer sizes and data pointers from an 
ArrowArray except for those /// that require dereferencing buffer content. NANOARROW_DLL ArrowErrorCode ArrowArrayViewSetArrayMinimal(struct ArrowArrayView* array_view, const struct ArrowArray* array, struct ArrowError* error); /// \brief Get the number of buffers /// /// The number of buffers referred to by this ArrowArrayView. In many cases this can also /// be calculated from the ArrowLayout member of the ArrowArrayView or ArrowSchemaView; /// however, for binary view and string view types, the number of total buffers depends on /// the number of variadic buffers. static inline int64_t ArrowArrayViewGetNumBuffers(struct ArrowArrayView* array_view); /// \brief Get a view of a specific buffer from an ArrowArrayView /// /// This is the ArrowArrayView equivalent of ArrowArray::buffers[i] that includes /// size information (if known). static inline struct ArrowBufferView ArrowArrayViewGetBufferView( struct ArrowArrayView* array_view, int64_t i); /// \brief Get the function of a specific buffer in an ArrowArrayView /// /// In many cases this can also be obtained from the ArrowLayout member of the /// ArrowArrayView or ArrowSchemaView; however, for binary view and string view types, /// the function of each buffer may be different between two arrays of the same type /// depending on the number of variadic buffers. static inline enum ArrowBufferType ArrowArrayViewGetBufferType( struct ArrowArrayView* array_view, int64_t i); /// \brief Get the data type of a specific buffer in an ArrowArrayView /// /// In many cases this can also be obtained from the ArrowLayout member of the /// ArrowArrayView or ArrowSchemaView; however, for binary view and string view types, /// the data type of each buffer may be different between two arrays of the same type /// depending on the number of variadic buffers. 
static inline enum ArrowType ArrowArrayViewGetBufferDataType( struct ArrowArrayView* array_view, int64_t i); /// \brief Get the element size (in bits) of a specific buffer in an ArrowArrayView /// /// In many cases this can also be obtained from the ArrowLayout member of the /// ArrowArrayView or ArrowSchemaView; however, for binary view and string view types, /// the element width of each buffer may be different between two arrays of the same type /// depending on the number of variadic buffers. static inline int64_t ArrowArrayViewGetBufferElementSizeBits( struct ArrowArrayView* array_view, int64_t i); /// \brief Performs checks on the content of an ArrowArrayView /// /// If using ArrowArrayViewSetArray() to back array_view with an ArrowArray, /// the buffer sizes and some content (first and last offset) have already /// been validated at the "default" level. If setting the buffer pointers /// and sizes otherwise, you may wish to perform checks at a different level. See /// documentation for ArrowValidationLevel for the details of checks performed /// at each level. NANOARROW_DLL ArrowErrorCode ArrowArrayViewValidate( struct ArrowArrayView* array_view, enum ArrowValidationLevel validation_level, struct ArrowError* error); /// \brief Compare two ArrowArrayView objects for equality /// /// Given two ArrowArrayView instances, place either 0 (not equal) or /// 1 (equal) at the address pointed to by out. If the comparison determines /// that actual and expected are not equal, a reason will be communicated via /// error if error is non-NULL. /// /// Returns NANOARROW_OK if the comparison completed successfully. 
NANOARROW_DLL ArrowErrorCode ArrowArrayViewCompare(const struct ArrowArrayView* actual, const struct ArrowArrayView* expected, enum ArrowCompareLevel level, int* out, struct ArrowError* reason); /// \brief Reset the contents of an ArrowArrayView and frees resources NANOARROW_DLL void ArrowArrayViewReset(struct ArrowArrayView* array_view); /// \brief Check for a null element in an ArrowArrayView static inline int8_t ArrowArrayViewIsNull(const struct ArrowArrayView* array_view, int64_t i); /// \brief Compute null count for an ArrowArrayView static inline int64_t ArrowArrayViewComputeNullCount( const struct ArrowArrayView* array_view); /// \brief Get the type id of a union array element static inline int8_t ArrowArrayViewUnionTypeId(const struct ArrowArrayView* array_view, int64_t i); /// \brief Get the child index of a union array element static inline int8_t ArrowArrayViewUnionChildIndex( const struct ArrowArrayView* array_view, int64_t i); /// \brief Get the index to use into the relevant union child array static inline int64_t ArrowArrayViewUnionChildOffset( const struct ArrowArrayView* array_view, int64_t i); /// \brief Get an element in an ArrowArrayView as an integer /// /// This function does not check for null values, that values are actually integers, or /// that values are within a valid range for an int64. static inline int64_t ArrowArrayViewGetIntUnsafe(const struct ArrowArrayView* array_view, int64_t i); /// \brief Get an element in an ArrowArrayView as an unsigned integer /// /// This function does not check for null values, that values are actually integers, or /// that values are within a valid range for a uint64. static inline uint64_t ArrowArrayViewGetUIntUnsafe( const struct ArrowArrayView* array_view, int64_t i); /// \brief Get an element in an ArrowArrayView as a double /// /// This function does not check for null values, or /// that values are within a valid range for a double. 
static inline double ArrowArrayViewGetDoubleUnsafe( const struct ArrowArrayView* array_view, int64_t i); /// \brief Get an element in an ArrowArrayView as an ArrowStringView /// /// This function does not check for null values. static inline struct ArrowStringView ArrowArrayViewGetStringUnsafe( const struct ArrowArrayView* array_view, int64_t i); /// \brief Get an element in an ArrowArrayView as an ArrowBufferView /// /// This function does not check for null values. static inline struct ArrowBufferView ArrowArrayViewGetBytesUnsafe( const struct ArrowArrayView* array_view, int64_t i); /// \brief Get an element in an ArrowArrayView as an ArrowDecimal /// /// This function does not check for null values. The out parameter must /// be initialized with ArrowDecimalInit() with the proper parameters for this /// type before calling this for the first time. static inline void ArrowArrayViewGetDecimalUnsafe(const struct ArrowArrayView* array_view, int64_t i, struct ArrowDecimal* out); /// @} /// \defgroup nanoarrow-basic-array-stream Basic ArrowArrayStream implementation /// /// An implementation of an ArrowArrayStream based on a collection of /// zero or more previously-existing ArrowArray objects. Users should /// initialize and/or validate the contents before transferring the /// responsibility of the ArrowArrayStream elsewhere. /// /// @{ /// \brief Initialize an ArrowArrayStream backed by this implementation /// /// This function moves the ownership of schema to the array_stream. If /// this function returns NANOARROW_OK, the caller is responsible for /// releasing the ArrowArrayStream. NANOARROW_DLL ArrowErrorCode ArrowBasicArrayStreamInit( struct ArrowArrayStream* array_stream, struct ArrowSchema* schema, int64_t n_arrays); /// \brief Set the ith ArrowArray in this ArrowArrayStream. /// /// array_stream must have been initialized with ArrowBasicArrayStreamInit(). /// This function moves the ownership of array to the array_stream. 
i must /// be greater than or equal to zero and less than the value of n_arrays passed in /// ArrowBasicArrayStreamInit(). Callers are not required to fill all /// n_arrays members (i.e., n_arrays is a maximum bound). NANOARROW_DLL void ArrowBasicArrayStreamSetArray(struct ArrowArrayStream* array_stream, int64_t i, struct ArrowArray* array); /// \brief Validate the contents of this ArrowArrayStream /// /// array_stream must have been initialized with ArrowBasicArrayStreamInit(). /// This function uses ArrowArrayStreamInitFromSchema() and ArrowArrayStreamSetArray() /// to validate the contents of the arrays. NANOARROW_DLL ArrowErrorCode ArrowBasicArrayStreamValidate( const struct ArrowArrayStream* array_stream, struct ArrowError* error); /// @} // Undefine ArrowErrorCode, which may have been defined to annotate functions that return // it to warn for an unused result. #if defined(ArrowErrorCode) #undef ArrowErrorCode #endif // Inline function definitions #ifdef __cplusplus } #endif #endif // Licensed to the Apache Software Foundation (ASF) under one // or more contributor license agreements. See the NOTICE file // distributed with this work for additional information // regarding copyright ownership. The ASF licenses this file // to you under the Apache License, Version 2.0 (the // "License"); you may not use this file except in compliance // with the License. You may obtain a copy of the License at // // http://www.apache.org/licenses/LICENSE-2.0 // // Unless required by applicable law or agreed to in writing, // software distributed under the License is distributed on an // "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY // KIND, either express or implied. See the License for the // specific language governing permissions and limitations // under the License. 
#ifndef NANOARROW_BUFFER_INLINE_H_INCLUDED #define NANOARROW_BUFFER_INLINE_H_INCLUDED #include #include #include #ifdef __cplusplus extern "C" { #endif // Modified from Arrow C++ (1eb46f76) cpp/src/arrow/chunk_resolver.h#L133-L162 static inline int64_t ArrowResolveChunk64(int64_t index, const int64_t* offsets, int64_t lo, int64_t hi) { // Similar to std::upper_bound(), but slightly different as our offsets // array always starts with 0. int64_t n = hi - lo; // First iteration does not need to check for n > 1 // (lo < hi is guaranteed by the precondition). NANOARROW_DCHECK(n > 1); do { const int64_t m = n >> 1; const int64_t mid = lo + m; if (index >= offsets[mid]) { lo = mid; n -= m; } else { n = m; } } while (n > 1); return lo; } static inline int64_t ArrowResolveChunk32(int32_t index, const int32_t* offsets, int32_t lo, int32_t hi) { // Similar to std::upper_bound(), but slightly different as our offsets // array always starts with 0. int32_t n = hi - lo; // First iteration does not need to check for n > 1 // (lo < hi is guaranteed by the precondition). 
NANOARROW_DCHECK(n > 1); do { const int32_t m = n >> 1; const int32_t mid = lo + m; if (index >= offsets[mid]) { lo = mid; n -= m; } else { n = m; } } while (n > 1); return lo; } static inline int64_t _ArrowGrowByFactor(int64_t current_capacity, int64_t new_capacity) { int64_t doubled_capacity = current_capacity * 2; if (doubled_capacity > new_capacity) { return doubled_capacity; } else { return new_capacity; } } // float to half float conversion, adapted from Arrow Go // https://github.com/apache/arrow/blob/main/go/arrow/float16/float16.go static inline uint16_t ArrowFloatToHalfFloat(float value) { union { float f; uint32_t b; } u; u.f = value; uint16_t sn = (uint16_t)((u.b >> 31) & 0x1); uint16_t exp = (u.b >> 23) & 0xff; int16_t res = (int16_t)(exp - 127 + 15); uint16_t fc = (uint16_t)(u.b >> 13) & 0x3ff; if (exp == 0) { res = 0; } else if (exp == 0xff) { res = 0x1f; } else if (res > 0x1e) { res = 0x1f; fc = 0; } else if (res < 0x01) { res = 0; fc = 0; } return (uint16_t)((sn << 15) | (uint16_t)(res << 10) | fc); } // half float to float conversion, adapted from Arrow Go // https://github.com/apache/arrow/blob/main/go/arrow/float16/float16.go static inline float ArrowHalfFloatToFloat(uint16_t value) { uint32_t sn = (uint32_t)((value >> 15) & 0x1); uint32_t exp = (value >> 10) & 0x1f; uint32_t res = exp + 127 - 15; uint32_t fc = value & 0x3ff; if (exp == 0) { res = 0; } else if (exp == 0x1f) { res = 0xff; } union { float f; uint32_t b; } u; u.b = (uint32_t)(sn << 31) | (uint32_t)(res << 23) | (uint32_t)(fc << 13); return u.f; } static inline void ArrowBufferInit(struct ArrowBuffer* buffer) { buffer->data = NULL; buffer->size_bytes = 0; buffer->capacity_bytes = 0; buffer->allocator = ArrowBufferAllocatorDefault(); } static inline ArrowErrorCode ArrowBufferSetAllocator( struct ArrowBuffer* buffer, struct ArrowBufferAllocator allocator) { // This is not a perfect test for "has a buffer already been allocated" // but is likely to catch most cases. 
if (buffer->data == NULL) { buffer->allocator = allocator; return NANOARROW_OK; } else { return EINVAL; } } static inline void ArrowBufferReset(struct ArrowBuffer* buffer) { buffer->allocator.free(&buffer->allocator, (uint8_t*)buffer->data, buffer->capacity_bytes); ArrowBufferInit(buffer); } static inline void ArrowBufferMove(struct ArrowBuffer* src, struct ArrowBuffer* dst) { memcpy(dst, src, sizeof(struct ArrowBuffer)); src->data = NULL; ArrowBufferInit(src); } static inline ArrowErrorCode ArrowBufferResize(struct ArrowBuffer* buffer, int64_t new_size_bytes, char shrink_to_fit) { if (new_size_bytes < 0) { return EINVAL; } int needs_reallocation = new_size_bytes > buffer->capacity_bytes || (shrink_to_fit && new_size_bytes < buffer->capacity_bytes); if (needs_reallocation) { buffer->data = buffer->allocator.reallocate(&buffer->allocator, buffer->data, buffer->capacity_bytes, new_size_bytes); if (buffer->data == NULL && new_size_bytes > 0) { buffer->capacity_bytes = 0; buffer->size_bytes = 0; return ENOMEM; } buffer->capacity_bytes = new_size_bytes; } buffer->size_bytes = new_size_bytes; return NANOARROW_OK; } static inline ArrowErrorCode ArrowBufferReserve(struct ArrowBuffer* buffer, int64_t additional_size_bytes) { int64_t min_capacity_bytes = buffer->size_bytes + additional_size_bytes; if (min_capacity_bytes <= buffer->capacity_bytes) { return NANOARROW_OK; } int64_t new_capacity_bytes = _ArrowGrowByFactor(buffer->capacity_bytes, min_capacity_bytes); buffer->data = buffer->allocator.reallocate(&buffer->allocator, buffer->data, buffer->capacity_bytes, new_capacity_bytes); if (buffer->data == NULL && new_capacity_bytes > 0) { buffer->capacity_bytes = 0; buffer->size_bytes = 0; return ENOMEM; } buffer->capacity_bytes = new_capacity_bytes; return NANOARROW_OK; } static inline void ArrowBufferAppendUnsafe(struct ArrowBuffer* buffer, const void* data, int64_t size_bytes) { if (size_bytes > 0) { NANOARROW_DCHECK(buffer->data != NULL); memcpy(buffer->data + 
buffer->size_bytes, data, size_bytes); buffer->size_bytes += size_bytes; } } static inline ArrowErrorCode ArrowBufferAppend(struct ArrowBuffer* buffer, const void* data, int64_t size_bytes) { NANOARROW_RETURN_NOT_OK(ArrowBufferReserve(buffer, size_bytes)); ArrowBufferAppendUnsafe(buffer, data, size_bytes); return NANOARROW_OK; } static inline ArrowErrorCode ArrowBufferAppendInt8(struct ArrowBuffer* buffer, int8_t value) { return ArrowBufferAppend(buffer, &value, sizeof(int8_t)); } static inline ArrowErrorCode ArrowBufferAppendUInt8(struct ArrowBuffer* buffer, uint8_t value) { return ArrowBufferAppend(buffer, &value, sizeof(uint8_t)); } static inline ArrowErrorCode ArrowBufferAppendInt16(struct ArrowBuffer* buffer, int16_t value) { return ArrowBufferAppend(buffer, &value, sizeof(int16_t)); } static inline ArrowErrorCode ArrowBufferAppendUInt16(struct ArrowBuffer* buffer, uint16_t value) { return ArrowBufferAppend(buffer, &value, sizeof(uint16_t)); } static inline ArrowErrorCode ArrowBufferAppendInt32(struct ArrowBuffer* buffer, int32_t value) { return ArrowBufferAppend(buffer, &value, sizeof(int32_t)); } static inline ArrowErrorCode ArrowBufferAppendUInt32(struct ArrowBuffer* buffer, uint32_t value) { return ArrowBufferAppend(buffer, &value, sizeof(uint32_t)); } static inline ArrowErrorCode ArrowBufferAppendInt64(struct ArrowBuffer* buffer, int64_t value) { return ArrowBufferAppend(buffer, &value, sizeof(int64_t)); } static inline ArrowErrorCode ArrowBufferAppendUInt64(struct ArrowBuffer* buffer, uint64_t value) { return ArrowBufferAppend(buffer, &value, sizeof(uint64_t)); } static inline ArrowErrorCode ArrowBufferAppendDouble(struct ArrowBuffer* buffer, double value) { return ArrowBufferAppend(buffer, &value, sizeof(double)); } static inline ArrowErrorCode ArrowBufferAppendFloat(struct ArrowBuffer* buffer, float value) { return ArrowBufferAppend(buffer, &value, sizeof(float)); } static inline ArrowErrorCode ArrowBufferAppendStringView(struct ArrowBuffer* buffer, 
struct ArrowStringView value) { return ArrowBufferAppend(buffer, value.data, value.size_bytes); } static inline ArrowErrorCode ArrowBufferAppendBufferView(struct ArrowBuffer* buffer, struct ArrowBufferView value) { return ArrowBufferAppend(buffer, value.data.data, value.size_bytes); } static inline ArrowErrorCode ArrowBufferAppendFill(struct ArrowBuffer* buffer, uint8_t value, int64_t size_bytes) { if (size_bytes == 0) { return NANOARROW_OK; } NANOARROW_RETURN_NOT_OK(ArrowBufferReserve(buffer, size_bytes)); NANOARROW_DCHECK(buffer->data != NULL); // To help clang-tidy memset(buffer->data + buffer->size_bytes, value, size_bytes); buffer->size_bytes += size_bytes; return NANOARROW_OK; } static const uint8_t _ArrowkBitmask[] = {1, 2, 4, 8, 16, 32, 64, 128}; static const uint8_t _ArrowkFlippedBitmask[] = {254, 253, 251, 247, 239, 223, 191, 127}; static const uint8_t _ArrowkPrecedingBitmask[] = {0, 1, 3, 7, 15, 31, 63, 127}; static const uint8_t _ArrowkTrailingBitmask[] = {255, 254, 252, 248, 240, 224, 192, 128}; static const uint8_t _ArrowkBytePopcount[] = { 0, 1, 1, 2, 1, 2, 2, 3, 1, 2, 2, 3, 2, 3, 3, 4, 1, 2, 2, 3, 2, 3, 3, 4, 2, 3, 3, 4, 3, 4, 4, 5, 1, 2, 2, 3, 2, 3, 3, 4, 2, 3, 3, 4, 3, 4, 4, 5, 2, 3, 3, 4, 3, 4, 4, 5, 3, 4, 4, 5, 4, 5, 5, 6, 1, 2, 2, 3, 2, 3, 3, 4, 2, 3, 3, 4, 3, 4, 4, 5, 2, 3, 3, 4, 3, 4, 4, 5, 3, 4, 4, 5, 4, 5, 5, 6, 2, 3, 3, 4, 3, 4, 4, 5, 3, 4, 4, 5, 4, 5, 5, 6, 3, 4, 4, 5, 4, 5, 5, 6, 4, 5, 5, 6, 5, 6, 6, 7, 1, 2, 2, 3, 2, 3, 3, 4, 2, 3, 3, 4, 3, 4, 4, 5, 2, 3, 3, 4, 3, 4, 4, 5, 3, 4, 4, 5, 4, 5, 5, 6, 2, 3, 3, 4, 3, 4, 4, 5, 3, 4, 4, 5, 4, 5, 5, 6, 3, 4, 4, 5, 4, 5, 5, 6, 4, 5, 5, 6, 5, 6, 6, 7, 2, 3, 3, 4, 3, 4, 4, 5, 3, 4, 4, 5, 4, 5, 5, 6, 3, 4, 4, 5, 4, 5, 5, 6, 4, 5, 5, 6, 5, 6, 6, 7, 3, 4, 4, 5, 4, 5, 5, 6, 4, 5, 5, 6, 5, 6, 6, 7, 4, 5, 5, 6, 5, 6, 6, 7, 5, 6, 6, 7, 6, 7, 7, 8}; static inline int64_t _ArrowRoundUpToMultipleOf8(int64_t value) { return (value + 7) & ~((int64_t)7); } static inline int64_t 
_ArrowRoundDownToMultipleOf8(int64_t value) { return (value / 8) * 8; } static inline int64_t _ArrowBytesForBits(int64_t bits) { return (bits >> 3) + ((bits & 7) != 0); } static inline void _ArrowBitsUnpackInt8(const uint8_t word, int8_t* out) { out[0] = (word & 0x1) != 0; out[1] = (word & 0x2) != 0; out[2] = (word & 0x4) != 0; out[3] = (word & 0x8) != 0; out[4] = (word & 0x10) != 0; out[5] = (word & 0x20) != 0; out[6] = (word & 0x40) != 0; out[7] = (word & 0x80) != 0; } static inline void _ArrowBitsUnpackInt32(const uint8_t word, int32_t* out) { out[0] = (word & 0x1) != 0; out[1] = (word & 0x2) != 0; out[2] = (word & 0x4) != 0; out[3] = (word & 0x8) != 0; out[4] = (word & 0x10) != 0; out[5] = (word & 0x20) != 0; out[6] = (word & 0x40) != 0; out[7] = (word & 0x80) != 0; } static inline void _ArrowBitmapPackInt8(const int8_t* values, uint8_t* out) { *out = (uint8_t)(values[0] | ((values[1] + 0x1) & 0x2) | ((values[2] + 0x3) & 0x4) | ((values[3] + 0x7) & 0x8) | ((values[4] + 0xf) & 0x10) | ((values[5] + 0x1f) & 0x20) | ((values[6] + 0x3f) & 0x40) | ((values[7] + 0x7f) & 0x80)); } static inline void _ArrowBitmapPackInt32(const int32_t* values, uint8_t* out) { *out = (uint8_t)(values[0] | ((values[1] + 0x1) & 0x2) | ((values[2] + 0x3) & 0x4) | ((values[3] + 0x7) & 0x8) | ((values[4] + 0xf) & 0x10) | ((values[5] + 0x1f) & 0x20) | ((values[6] + 0x3f) & 0x40) | ((values[7] + 0x7f) & 0x80)); } static inline int8_t ArrowBitGet(const uint8_t* bits, int64_t i) { return (bits[i >> 3] >> (i & 0x07)) & 1; } static inline void ArrowBitsUnpackInt8(const uint8_t* bits, int64_t start_offset, int64_t length, int8_t* out) { if (length == 0) { return; } const int64_t i_begin = start_offset; const int64_t i_end = start_offset + length; const int64_t i_last_valid = i_end - 1; const int64_t bytes_begin = i_begin / 8; const int64_t bytes_last_valid = i_last_valid / 8; if (bytes_begin == bytes_last_valid) { for (int i = 0; i < length; i++) { out[i] = ArrowBitGet(&bits[bytes_begin], i + 
i_begin % 8); } return; } // first byte for (int i = 0; i < 8 - (i_begin % 8); i++) { *out++ = ArrowBitGet(&bits[bytes_begin], i + i_begin % 8); } // middle bytes for (int64_t i = bytes_begin + 1; i < bytes_last_valid; i++) { _ArrowBitsUnpackInt8(bits[i], out); out += 8; } // last byte const int bits_remaining = (int)(i_end % 8 == 0 ? 8 : i_end % 8); for (int i = 0; i < bits_remaining; i++) { *out++ = ArrowBitGet(&bits[bytes_last_valid], i); } } static inline void ArrowBitsUnpackInt32(const uint8_t* bits, int64_t start_offset, int64_t length, int32_t* out) { if (length == 0) { return; } NANOARROW_DCHECK(bits != NULL && out != NULL); const int64_t i_begin = start_offset; const int64_t i_end = start_offset + length; const int64_t i_last_valid = i_end - 1; const int64_t bytes_begin = i_begin / 8; const int64_t bytes_last_valid = i_last_valid / 8; if (bytes_begin == bytes_last_valid) { for (int i = 0; i < length; i++) { out[i] = ArrowBitGet(&bits[bytes_begin], i + i_begin % 8); } return; } // first byte for (int i = 0; i < 8 - (i_begin % 8); i++) { *out++ = ArrowBitGet(&bits[bytes_begin], i + i_begin % 8); } // middle bytes for (int64_t i = bytes_begin + 1; i < bytes_last_valid; i++) { _ArrowBitsUnpackInt32(bits[i], out); out += 8; } // last byte const int bits_remaining = (int)(i_end % 8 == 0 ? 
8 : i_end % 8); for (int i = 0; i < bits_remaining; i++) { *out++ = ArrowBitGet(&bits[bytes_last_valid], i); } } static inline void ArrowBitSet(uint8_t* bits, int64_t i) { bits[i / 8] |= _ArrowkBitmask[i % 8]; } static inline void ArrowBitClear(uint8_t* bits, int64_t i) { bits[i / 8] &= _ArrowkFlippedBitmask[i % 8]; } static inline void ArrowBitSetTo(uint8_t* bits, int64_t i, uint8_t bit_is_set) { bits[i / 8] ^= (uint8_t)(((uint8_t)(-((uint8_t)(bit_is_set != 0)) ^ bits[i / 8])) & _ArrowkBitmask[i % 8]); } static inline void ArrowBitsSetTo(uint8_t* bits, int64_t start_offset, int64_t length, uint8_t bits_are_set) { if (length == 0) { return; } NANOARROW_DCHECK(bits != NULL); const int64_t i_begin = start_offset; const int64_t i_end = start_offset + length; const uint8_t fill_byte = (uint8_t)(-bits_are_set); const int64_t bytes_begin = i_begin / 8; const int64_t bytes_end = i_end / 8 + 1; const uint8_t first_byte_mask = _ArrowkPrecedingBitmask[i_begin % 8]; const uint8_t last_byte_mask = _ArrowkTrailingBitmask[i_end % 8]; if (bytes_end == bytes_begin + 1) { // set bits within a single byte const uint8_t only_byte_mask = i_end % 8 == 0 ? 
first_byte_mask : (uint8_t)(first_byte_mask | last_byte_mask); bits[bytes_begin] &= only_byte_mask; bits[bytes_begin] |= (uint8_t)(fill_byte & ~only_byte_mask); return; } // set/clear trailing bits of first byte bits[bytes_begin] &= first_byte_mask; bits[bytes_begin] |= (uint8_t)(fill_byte & ~first_byte_mask); if (bytes_end - bytes_begin > 2) { // set/clear whole bytes memset(bits + bytes_begin + 1, fill_byte, (size_t)(bytes_end - bytes_begin - 2)); } if (i_end % 8 == 0) { return; } // set/clear leading bits of last byte bits[bytes_end - 1] &= last_byte_mask; bits[bytes_end - 1] |= (uint8_t)(fill_byte & ~last_byte_mask); } static inline int64_t ArrowBitCountSet(const uint8_t* bits, int64_t start_offset, int64_t length) { if (length == 0) { return 0; } NANOARROW_DCHECK(bits != NULL); const int64_t i_begin = start_offset; const int64_t i_end = start_offset + length; const int64_t i_last_valid = i_end - 1; const int64_t bytes_begin = i_begin / 8; const int64_t bytes_last_valid = i_last_valid / 8; if (bytes_begin == bytes_last_valid) { // count bits within a single byte const uint8_t first_byte_mask = _ArrowkPrecedingBitmask[i_end % 8]; const uint8_t last_byte_mask = _ArrowkTrailingBitmask[i_begin % 8]; const uint8_t only_byte_mask = i_end % 8 == 0 ? last_byte_mask : (uint8_t)(first_byte_mask & last_byte_mask); const uint8_t byte_masked = bits[bytes_begin] & only_byte_mask; return _ArrowkBytePopcount[byte_masked]; } const uint8_t first_byte_mask = _ArrowkPrecedingBitmask[i_begin % 8]; const uint8_t last_byte_mask = i_end % 8 == 0 ? 
0 : _ArrowkTrailingBitmask[i_end % 8]; int64_t count = 0; // first byte count += _ArrowkBytePopcount[bits[bytes_begin] & ~first_byte_mask]; // middle bytes for (int64_t i = bytes_begin + 1; i < bytes_last_valid; i++) { count += _ArrowkBytePopcount[bits[i]]; } // last byte count += _ArrowkBytePopcount[bits[bytes_last_valid] & ~last_byte_mask]; return count; } static inline void ArrowBitmapInit(struct ArrowBitmap* bitmap) { ArrowBufferInit(&bitmap->buffer); bitmap->size_bits = 0; } static inline void ArrowBitmapMove(struct ArrowBitmap* src, struct ArrowBitmap* dst) { ArrowBufferMove(&src->buffer, &dst->buffer); dst->size_bits = src->size_bits; src->size_bits = 0; } static inline ArrowErrorCode ArrowBitmapReserve(struct ArrowBitmap* bitmap, int64_t additional_size_bits) { int64_t min_capacity_bits = bitmap->size_bits + additional_size_bits; int64_t min_capacity_bytes = _ArrowBytesForBits(min_capacity_bits); int64_t current_size_bytes = bitmap->buffer.size_bytes; int64_t current_capacity_bytes = bitmap->buffer.capacity_bytes; if (min_capacity_bytes <= current_capacity_bytes) { return NANOARROW_OK; } int64_t additional_capacity_bytes = min_capacity_bytes - current_size_bytes; NANOARROW_RETURN_NOT_OK(ArrowBufferReserve(&bitmap->buffer, additional_capacity_bytes)); // Zero out the last byte for deterministic output in the common case // of reserving a known remaining size. We should have returned above // if there was not at least one additional byte to allocate; however, // DCHECK() just to be sure. 
NANOARROW_DCHECK(bitmap->buffer.capacity_bytes > current_capacity_bytes); bitmap->buffer.data[bitmap->buffer.capacity_bytes - 1] = 0; return NANOARROW_OK; } static inline ArrowErrorCode ArrowBitmapResize(struct ArrowBitmap* bitmap, int64_t new_size_bits, char shrink_to_fit) { if (new_size_bits < 0) { return EINVAL; } int64_t new_size_bytes = _ArrowBytesForBits(new_size_bits); NANOARROW_RETURN_NOT_OK( ArrowBufferResize(&bitmap->buffer, new_size_bytes, shrink_to_fit)); bitmap->size_bits = new_size_bits; return NANOARROW_OK; } static inline ArrowErrorCode ArrowBitmapAppend(struct ArrowBitmap* bitmap, uint8_t bits_are_set, int64_t length) { NANOARROW_RETURN_NOT_OK(ArrowBitmapReserve(bitmap, length)); ArrowBitmapAppendUnsafe(bitmap, bits_are_set, length); return NANOARROW_OK; } static inline void ArrowBitmapAppendUnsafe(struct ArrowBitmap* bitmap, uint8_t bits_are_set, int64_t length) { ArrowBitsSetTo(bitmap->buffer.data, bitmap->size_bits, length, bits_are_set); bitmap->size_bits += length; bitmap->buffer.size_bytes = _ArrowBytesForBits(bitmap->size_bits); } static inline void ArrowBitmapAppendInt8Unsafe(struct ArrowBitmap* bitmap, const int8_t* values, int64_t n_values) { if (n_values == 0) { return; } NANOARROW_DCHECK(bitmap->buffer.data != NULL); NANOARROW_DCHECK(values != NULL); const int8_t* values_cursor = values; int64_t n_remaining = n_values; int64_t out_i_cursor = bitmap->size_bits; uint8_t* out_cursor = bitmap->buffer.data + bitmap->size_bits / 8; // First byte if ((out_i_cursor % 8) != 0) { int64_t n_partial_bits = _ArrowRoundUpToMultipleOf8(out_i_cursor) - out_i_cursor; for (int i = 0; i < n_partial_bits; i++) { ArrowBitSetTo(bitmap->buffer.data, out_i_cursor++, values[i]); } out_cursor++; values_cursor += n_partial_bits; n_remaining -= n_partial_bits; } // Middle bytes int64_t n_full_bytes = n_remaining / 8; for (int64_t i = 0; i < n_full_bytes; i++) { _ArrowBitmapPackInt8(values_cursor, out_cursor); values_cursor += 8; out_cursor++; } // Last byte 
out_i_cursor += n_full_bytes * 8; n_remaining -= n_full_bytes * 8; if (n_remaining > 0) { // Zero out the last byte *out_cursor = 0x00; for (int i = 0; i < n_remaining; i++) { ArrowBitSetTo(bitmap->buffer.data, out_i_cursor++, values_cursor[i]); } out_cursor++; } bitmap->size_bits += n_values; bitmap->buffer.size_bytes = out_cursor - bitmap->buffer.data; } static inline void ArrowBitmapAppendInt32Unsafe(struct ArrowBitmap* bitmap, const int32_t* values, int64_t n_values) { if (n_values == 0) { return; } NANOARROW_DCHECK(bitmap->buffer.data != NULL); NANOARROW_DCHECK(values != NULL); const int32_t* values_cursor = values; int64_t n_remaining = n_values; int64_t out_i_cursor = bitmap->size_bits; uint8_t* out_cursor = bitmap->buffer.data + bitmap->size_bits / 8; // First byte if ((out_i_cursor % 8) != 0) { int64_t n_partial_bits = _ArrowRoundUpToMultipleOf8(out_i_cursor) - out_i_cursor; for (int i = 0; i < n_partial_bits; i++) { ArrowBitSetTo(bitmap->buffer.data, out_i_cursor++, (uint8_t)values[i]); } out_cursor++; values_cursor += n_partial_bits; n_remaining -= n_partial_bits; } // Middle bytes int64_t n_full_bytes = n_remaining / 8; for (int64_t i = 0; i < n_full_bytes; i++) { _ArrowBitmapPackInt32(values_cursor, out_cursor); values_cursor += 8; out_cursor++; } // Last byte out_i_cursor += n_full_bytes * 8; n_remaining -= n_full_bytes * 8; if (n_remaining > 0) { // Zero out the last byte *out_cursor = 0x00; for (int i = 0; i < n_remaining; i++) { ArrowBitSetTo(bitmap->buffer.data, out_i_cursor++, (uint8_t)values_cursor[i]); } out_cursor++; } bitmap->size_bits += n_values; bitmap->buffer.size_bytes = out_cursor - bitmap->buffer.data; } static inline void ArrowBitmapReset(struct ArrowBitmap* bitmap) { ArrowBufferReset(&bitmap->buffer); bitmap->size_bits = 0; } #ifdef __cplusplus } #endif #endif // Licensed to the Apache Software Foundation (ASF) under one // or more contributor license agreements. 
See the NOTICE file // distributed with this work for additional information // regarding copyright ownership. The ASF licenses this file // to you under the Apache License, Version 2.0 (the // "License"); you may not use this file except in compliance // with the License. You may obtain a copy of the License at // // http://www.apache.org/licenses/LICENSE-2.0 // // Unless required by applicable law or agreed to in writing, // software distributed under the License is distributed on an // "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY // KIND, either express or implied. See the License for the // specific language governing permissions and limitations // under the License. #ifndef NANOARROW_ARRAY_INLINE_H_INCLUDED #define NANOARROW_ARRAY_INLINE_H_INCLUDED #include #include #include #include #include #ifdef __cplusplus extern "C" { #endif static inline struct ArrowBitmap* ArrowArrayValidityBitmap(struct ArrowArray* array) { struct ArrowArrayPrivateData* private_data = (struct ArrowArrayPrivateData*)array->private_data; return &private_data->bitmap; } static inline struct ArrowBuffer* ArrowArrayBuffer(struct ArrowArray* array, int64_t i) { struct ArrowArrayPrivateData* private_data = (struct ArrowArrayPrivateData*)array->private_data; switch (i) { case 0: return &private_data->bitmap.buffer; case 1: return private_data->buffers; default: if (array->n_buffers > 3 && i == (array->n_buffers - 1)) { // The variadic buffer sizes buffer if for a BinaryView/String view array // is always stored in private_data->buffers[1]; however, from the numbered // buffers perspective this is the array->buffers[array->n_buffers - 1]. 
return private_data->buffers + 1; } else if (array->n_buffers > 3) { // If there are one or more variadic buffers, they are stored in // private_data->variadic_buffers return private_data->variadic_buffers + (i - 2); } else { // Otherwise, we're just accessing buffer at index 2 (e.g., String/Binary // data buffer or variadic sizes buffer for the case where there are no // variadic buffers) NANOARROW_DCHECK(i == 2); return private_data->buffers + i - 1; } } } // We don't currently support the case of unions where type_id != child_index; // however, these functions are used to keep track of where that assumption // is made. static inline int8_t _ArrowArrayUnionChildIndex(struct ArrowArray* array, int8_t type_id) { NANOARROW_UNUSED(array); return type_id; } static inline int8_t _ArrowArrayUnionTypeId(struct ArrowArray* array, int8_t child_index) { NANOARROW_UNUSED(array); return child_index; } static inline int32_t _ArrowParseUnionTypeIds(const char* type_ids, int8_t* out) { if (*type_ids == '\0') { return 0; } int32_t i = 0; long type_id; char* end_ptr; do { type_id = strtol(type_ids, &end_ptr, 10); if (end_ptr == type_ids || type_id < 0 || type_id > 127) { return -1; } if (out != NULL) { out[i] = (int8_t)type_id; } i++; type_ids = end_ptr; if (*type_ids == '\0') { return i; } else if (*type_ids != ',') { return -1; } else { type_ids++; } } while (1); return -1; } static inline int8_t _ArrowParsedUnionTypeIdsWillEqualChildIndices(const int8_t* type_ids, int64_t n_type_ids, int64_t n_children) { if (n_type_ids != n_children) { return 0; } for (int8_t i = 0; i < n_type_ids; i++) { if (type_ids[i] != i) { return 0; } } return 1; } static inline int8_t _ArrowUnionTypeIdsWillEqualChildIndices(const char* type_id_str, int64_t n_children) { int8_t type_ids[128]; int32_t n_type_ids = _ArrowParseUnionTypeIds(type_id_str, type_ids); return _ArrowParsedUnionTypeIdsWillEqualChildIndices(type_ids, n_type_ids, n_children); } static inline ArrowErrorCode 
ArrowArrayStartAppending(struct ArrowArray* array) { struct ArrowArrayPrivateData* private_data = (struct ArrowArrayPrivateData*)array->private_data; switch (private_data->storage_type) { case NANOARROW_TYPE_UNINITIALIZED: return EINVAL; case NANOARROW_TYPE_SPARSE_UNION: case NANOARROW_TYPE_DENSE_UNION: // Note that this value could be -1 if the type_ids string was invalid if (private_data->union_type_id_is_child_index != 1) { return EINVAL; } else { break; } default: break; } if (private_data->storage_type == NANOARROW_TYPE_UNINITIALIZED) { return EINVAL; } // Initialize any data offset buffer with a single zero for (int i = 0; i < NANOARROW_MAX_FIXED_BUFFERS; i++) { if (private_data->layout.buffer_type[i] == NANOARROW_BUFFER_TYPE_DATA_OFFSET && private_data->layout.element_size_bits[i] == 64) { NANOARROW_RETURN_NOT_OK(ArrowBufferAppendInt64(ArrowArrayBuffer(array, i), 0)); } else if (private_data->layout.buffer_type[i] == NANOARROW_BUFFER_TYPE_DATA_OFFSET && private_data->layout.element_size_bits[i] == 32) { NANOARROW_RETURN_NOT_OK(ArrowBufferAppendInt32(ArrowArrayBuffer(array, i), 0)); } } // Start building any child arrays or dictionaries for (int64_t i = 0; i < array->n_children; i++) { NANOARROW_RETURN_NOT_OK(ArrowArrayStartAppending(array->children[i])); } if (array->dictionary != NULL) { NANOARROW_RETURN_NOT_OK(ArrowArrayStartAppending(array->dictionary)); } return NANOARROW_OK; } static inline ArrowErrorCode ArrowArrayShrinkToFit(struct ArrowArray* array) { for (int64_t i = 0; i < NANOARROW_MAX_FIXED_BUFFERS; i++) { struct ArrowBuffer* buffer = ArrowArrayBuffer(array, i); NANOARROW_RETURN_NOT_OK(ArrowBufferResize(buffer, buffer->size_bytes, 1)); } for (int64_t i = 0; i < array->n_children; i++) { NANOARROW_RETURN_NOT_OK(ArrowArrayShrinkToFit(array->children[i])); } if (array->dictionary != NULL) { NANOARROW_RETURN_NOT_OK(ArrowArrayShrinkToFit(array->dictionary)); } return NANOARROW_OK; } static inline ArrowErrorCode _ArrowArrayAppendBits(struct ArrowArray* 
array, int64_t buffer_i, uint8_t value, int64_t n) { struct ArrowArrayPrivateData* private_data = (struct ArrowArrayPrivateData*)array->private_data; struct ArrowBuffer* buffer = ArrowArrayBuffer(array, buffer_i); int64_t bytes_required = _ArrowRoundUpToMultipleOf8(private_data->layout.element_size_bits[buffer_i] * (array->length + 1)) / 8; if (bytes_required > buffer->size_bytes) { NANOARROW_RETURN_NOT_OK( ArrowBufferAppendFill(buffer, 0, bytes_required - buffer->size_bytes)); } ArrowBitsSetTo(buffer->data, array->length, n, value); return NANOARROW_OK; } static inline ArrowErrorCode _ArrowArrayAppendEmptyInternal(struct ArrowArray* array, int64_t n, uint8_t is_valid) { struct ArrowArrayPrivateData* private_data = (struct ArrowArrayPrivateData*)array->private_data; if (n == 0) { return NANOARROW_OK; } // Some type-specific handling switch (private_data->storage_type) { case NANOARROW_TYPE_NA: // (An empty value for a null array *is* a null) array->null_count += n; array->length += n; return NANOARROW_OK; case NANOARROW_TYPE_DENSE_UNION: { // Add one null to the first child and append n references to that child int8_t type_id = _ArrowArrayUnionTypeId(array, 0); NANOARROW_RETURN_NOT_OK( _ArrowArrayAppendEmptyInternal(array->children[0], 1, is_valid)); NANOARROW_RETURN_NOT_OK( ArrowBufferAppendFill(ArrowArrayBuffer(array, 0), type_id, n)); for (int64_t i = 0; i < n; i++) { NANOARROW_RETURN_NOT_OK(ArrowBufferAppendInt32( ArrowArrayBuffer(array, 1), (int32_t)array->children[0]->length - 1)); } // For the purposes of array->null_count, union elements are never considered "null" // even if some children contain nulls. 
array->length += n; return NANOARROW_OK; } case NANOARROW_TYPE_SPARSE_UNION: { // Add n nulls to the first child and append n references to that child int8_t type_id = _ArrowArrayUnionTypeId(array, 0); NANOARROW_RETURN_NOT_OK( _ArrowArrayAppendEmptyInternal(array->children[0], n, is_valid)); for (int64_t i = 1; i < array->n_children; i++) { NANOARROW_RETURN_NOT_OK(ArrowArrayAppendEmpty(array->children[i], n)); } NANOARROW_RETURN_NOT_OK( ArrowBufferAppendFill(ArrowArrayBuffer(array, 0), type_id, n)); // For the purposes of array->null_count, union elements are never considered "null" // even if some children contain nulls. array->length += n; return NANOARROW_OK; } case NANOARROW_TYPE_FIXED_SIZE_LIST: NANOARROW_RETURN_NOT_OK(ArrowArrayAppendEmpty( array->children[0], n * private_data->layout.child_size_elements)); break; case NANOARROW_TYPE_STRUCT: for (int64_t i = 0; i < array->n_children; i++) { NANOARROW_RETURN_NOT_OK(ArrowArrayAppendEmpty(array->children[i], n)); } break; default: break; } // Append n is_valid bits to the validity bitmap. If we haven't allocated a bitmap yet // and we need to append nulls, do it now. 
if (!is_valid && private_data->bitmap.buffer.data == NULL) { NANOARROW_RETURN_NOT_OK(ArrowBitmapReserve(&private_data->bitmap, array->length + n)); ArrowBitmapAppendUnsafe(&private_data->bitmap, 1, array->length); ArrowBitmapAppendUnsafe(&private_data->bitmap, is_valid, n); } else if (private_data->bitmap.buffer.data != NULL) { NANOARROW_RETURN_NOT_OK(ArrowBitmapReserve(&private_data->bitmap, n)); ArrowBitmapAppendUnsafe(&private_data->bitmap, is_valid, n); } // Add appropriate buffer fill for (int i = 0; i < NANOARROW_MAX_FIXED_BUFFERS; i++) { struct ArrowBuffer* buffer = ArrowArrayBuffer(array, i); int64_t size_bytes = private_data->layout.element_size_bits[i] / 8; switch (private_data->layout.buffer_type[i]) { case NANOARROW_BUFFER_TYPE_NONE: case NANOARROW_BUFFER_TYPE_VARIADIC_DATA: case NANOARROW_BUFFER_TYPE_VARIADIC_SIZE: case NANOARROW_BUFFER_TYPE_VALIDITY: // These buffer types don't require initialization for empty appends: // - NONE: No buffer exists // - VARIADIC_*: Handled by child arrays // - VALIDITY: Already handled in previous bitmap logic break; case NANOARROW_BUFFER_TYPE_SIZE: // Size buffers (e.g., string/array lengths) should be zero-initialized: // This ensures empty elements have logical zero-length NANOARROW_RETURN_NOT_OK(ArrowBufferAppendFill(buffer, 0, size_bytes * n)); break; case NANOARROW_BUFFER_TYPE_DATA_OFFSET: // Offset buffers require special handling to maintain continuity. // 1. Reserve space for new offset entries NANOARROW_RETURN_NOT_OK(ArrowBufferReserve(buffer, size_bytes * n)); // 2. Duplicate last offset value for each new (empty) element for (int64_t j = 0; j < n; j++) { ArrowBufferAppendUnsafe(buffer, buffer->data + size_bytes * (array->length + j), size_bytes); } // 3. 
Skip next buffer (DATA) since it's paired with offsets // Rationale: Offset buffers are always followed by data buffers // that don't require separate initialization here i++; break; case NANOARROW_BUFFER_TYPE_DATA: // Fixed-width data buffers require zero-initialization: if (private_data->layout.element_size_bits[i] % 8 == 0) { // Byte-aligned: use efficient memset-style fill NANOARROW_RETURN_NOT_OK(ArrowBufferAppendFill(buffer, 0, size_bytes * n)); } else { // Bit-packed: use special bitwise initialization NANOARROW_RETURN_NOT_OK(_ArrowArrayAppendBits(array, i, 0, n)); } break; case NANOARROW_BUFFER_TYPE_VIEW_OFFSET: // View offset buffers (for string/binary view types) require zero-initialization. NANOARROW_RETURN_NOT_OK(ArrowBufferReserve(buffer, size_bytes * n)); NANOARROW_RETURN_NOT_OK(ArrowBufferAppendFill(buffer, 0, size_bytes * n)); break; case NANOARROW_BUFFER_TYPE_TYPE_ID: case NANOARROW_BUFFER_TYPE_UNION_OFFSET: // These buffer types should have been handled by the outer type switch and // are not expected here, indicating an internal logic error. 
return EINVAL; } } array->length += n; array->null_count += n * !is_valid; return NANOARROW_OK; } static inline ArrowErrorCode ArrowArrayAppendNull(struct ArrowArray* array, int64_t n) { return _ArrowArrayAppendEmptyInternal(array, n, 0); } static inline ArrowErrorCode ArrowArrayAppendEmpty(struct ArrowArray* array, int64_t n) { return _ArrowArrayAppendEmptyInternal(array, n, 1); } static inline ArrowErrorCode ArrowArrayAppendInt(struct ArrowArray* array, int64_t value) { struct ArrowArrayPrivateData* private_data = (struct ArrowArrayPrivateData*)array->private_data; struct ArrowBuffer* data_buffer = ArrowArrayBuffer(array, 1); switch (private_data->storage_type) { case NANOARROW_TYPE_INT64: NANOARROW_RETURN_NOT_OK(ArrowBufferAppend(data_buffer, &value, sizeof(int64_t))); break; case NANOARROW_TYPE_INT32: _NANOARROW_CHECK_RANGE(value, INT32_MIN, INT32_MAX); NANOARROW_RETURN_NOT_OK(ArrowBufferAppendInt32(data_buffer, (int32_t)value)); break; case NANOARROW_TYPE_INT16: _NANOARROW_CHECK_RANGE(value, INT16_MIN, INT16_MAX); NANOARROW_RETURN_NOT_OK(ArrowBufferAppendInt16(data_buffer, (int16_t)value)); break; case NANOARROW_TYPE_INT8: _NANOARROW_CHECK_RANGE(value, INT8_MIN, INT8_MAX); NANOARROW_RETURN_NOT_OK(ArrowBufferAppendInt8(data_buffer, (int8_t)value)); break; case NANOARROW_TYPE_UINT64: case NANOARROW_TYPE_UINT32: case NANOARROW_TYPE_UINT16: case NANOARROW_TYPE_UINT8: _NANOARROW_CHECK_RANGE(value, 0, INT64_MAX); return ArrowArrayAppendUInt(array, value); case NANOARROW_TYPE_DOUBLE: NANOARROW_RETURN_NOT_OK(ArrowBufferAppendDouble(data_buffer, (double)value)); break; case NANOARROW_TYPE_FLOAT: NANOARROW_RETURN_NOT_OK(ArrowBufferAppendFloat(data_buffer, (float)value)); break; case NANOARROW_TYPE_HALF_FLOAT: NANOARROW_RETURN_NOT_OK( ArrowBufferAppendUInt16(data_buffer, ArrowFloatToHalfFloat((float)value))); break; case NANOARROW_TYPE_BOOL: NANOARROW_RETURN_NOT_OK(_ArrowArrayAppendBits(array, 1, value != 0, 1)); break; default: return EINVAL; } if 
(private_data->bitmap.buffer.data != NULL) { NANOARROW_RETURN_NOT_OK(ArrowBitmapAppend(ArrowArrayValidityBitmap(array), 1, 1)); } array->length++; return NANOARROW_OK; } static inline ArrowErrorCode ArrowArrayAppendUInt(struct ArrowArray* array, uint64_t value) { struct ArrowArrayPrivateData* private_data = (struct ArrowArrayPrivateData*)array->private_data; struct ArrowBuffer* data_buffer = ArrowArrayBuffer(array, 1); switch (private_data->storage_type) { case NANOARROW_TYPE_UINT64: NANOARROW_RETURN_NOT_OK(ArrowBufferAppend(data_buffer, &value, sizeof(uint64_t))); break; case NANOARROW_TYPE_UINT32: _NANOARROW_CHECK_UPPER_LIMIT(value, UINT32_MAX); NANOARROW_RETURN_NOT_OK(ArrowBufferAppendUInt32(data_buffer, (uint32_t)value)); break; case NANOARROW_TYPE_UINT16: _NANOARROW_CHECK_UPPER_LIMIT(value, UINT16_MAX); NANOARROW_RETURN_NOT_OK(ArrowBufferAppendUInt16(data_buffer, (uint16_t)value)); break; case NANOARROW_TYPE_UINT8: _NANOARROW_CHECK_UPPER_LIMIT(value, UINT8_MAX); NANOARROW_RETURN_NOT_OK(ArrowBufferAppendUInt8(data_buffer, (uint8_t)value)); break; case NANOARROW_TYPE_INT64: case NANOARROW_TYPE_INT32: case NANOARROW_TYPE_INT16: case NANOARROW_TYPE_INT8: _NANOARROW_CHECK_UPPER_LIMIT(value, INT64_MAX); return ArrowArrayAppendInt(array, value); case NANOARROW_TYPE_DOUBLE: NANOARROW_RETURN_NOT_OK(ArrowBufferAppendDouble(data_buffer, (double)value)); break; case NANOARROW_TYPE_FLOAT: NANOARROW_RETURN_NOT_OK(ArrowBufferAppendFloat(data_buffer, (float)value)); break; case NANOARROW_TYPE_HALF_FLOAT: NANOARROW_RETURN_NOT_OK( ArrowBufferAppendUInt16(data_buffer, ArrowFloatToHalfFloat((float)value))); break; case NANOARROW_TYPE_BOOL: NANOARROW_RETURN_NOT_OK(_ArrowArrayAppendBits(array, 1, value != 0, 1)); break; default: return EINVAL; } if (private_data->bitmap.buffer.data != NULL) { NANOARROW_RETURN_NOT_OK(ArrowBitmapAppend(ArrowArrayValidityBitmap(array), 1, 1)); } array->length++; return NANOARROW_OK; } static inline ArrowErrorCode ArrowArrayAppendDouble(struct 
ArrowArray* array, double value) { struct ArrowArrayPrivateData* private_data = (struct ArrowArrayPrivateData*)array->private_data; struct ArrowBuffer* data_buffer = ArrowArrayBuffer(array, 1); switch (private_data->storage_type) { case NANOARROW_TYPE_DOUBLE: NANOARROW_RETURN_NOT_OK(ArrowBufferAppend(data_buffer, &value, sizeof(double))); break; case NANOARROW_TYPE_FLOAT: NANOARROW_RETURN_NOT_OK(ArrowBufferAppendFloat(data_buffer, (float)value)); break; case NANOARROW_TYPE_HALF_FLOAT: NANOARROW_RETURN_NOT_OK( ArrowBufferAppendUInt16(data_buffer, ArrowFloatToHalfFloat((float)value))); break; default: return EINVAL; } if (private_data->bitmap.buffer.data != NULL) { NANOARROW_RETURN_NOT_OK(ArrowBitmapAppend(ArrowArrayValidityBitmap(array), 1, 1)); } array->length++; return NANOARROW_OK; } // Binary views only have two fixed buffers, but be aware that they must also // always have more 1 buffer to store variadic buffer sizes (even if there are none) #define NANOARROW_BINARY_VIEW_FIXED_BUFFERS 2 #define NANOARROW_BINARY_VIEW_INLINE_SIZE 12 #define NANOARROW_BINARY_VIEW_PREFIX_SIZE 4 #define NANOARROW_BINARY_VIEW_BLOCK_SIZE (32 << 10) // 32KB // The Arrow C++ implementation uses anonymous structs as members // of the ArrowBinaryView. 
For Cython support in this library, we define // those structs outside of the ArrowBinaryView struct ArrowBinaryViewInlined { int32_t size; uint8_t data[NANOARROW_BINARY_VIEW_INLINE_SIZE]; }; struct ArrowBinaryViewRef { int32_t size; uint8_t prefix[NANOARROW_BINARY_VIEW_PREFIX_SIZE]; int32_t buffer_index; int32_t offset; }; union ArrowBinaryView { struct ArrowBinaryViewInlined inlined; struct ArrowBinaryViewRef ref; int64_t alignment_dummy; }; static inline int32_t ArrowArrayVariadicBufferCount(struct ArrowArray* array) { struct ArrowArrayPrivateData* private_data = (struct ArrowArrayPrivateData*)array->private_data; return private_data->n_variadic_buffers; } static inline ArrowErrorCode ArrowArrayAddVariadicBuffers(struct ArrowArray* array, int32_t n_buffers) { const int32_t n_current_bufs = ArrowArrayVariadicBufferCount(array); const int32_t nvariadic_bufs_needed = n_current_bufs + n_buffers; struct ArrowArrayPrivateData* private_data = (struct ArrowArrayPrivateData*)array->private_data; private_data->variadic_buffers = (struct ArrowBuffer*)ArrowRealloc( private_data->variadic_buffers, sizeof(struct ArrowBuffer) * nvariadic_bufs_needed); if (private_data->variadic_buffers == NULL) { return ENOMEM; } private_data->n_variadic_buffers = nvariadic_bufs_needed; array->n_buffers = NANOARROW_BINARY_VIEW_FIXED_BUFFERS + 1 + nvariadic_bufs_needed; private_data->buffer_data = (const void**)ArrowRealloc( private_data->buffer_data, array->n_buffers * sizeof(void*)); for (int32_t i = n_current_bufs; i < nvariadic_bufs_needed; i++) { ArrowBufferInit(&private_data->variadic_buffers[i]); private_data->buffer_data[NANOARROW_BINARY_VIEW_FIXED_BUFFERS + i] = NULL; } // Zero out memory for the final buffer (variadic sizes buffer we haven't built yet) private_data->buffer_data[NANOARROW_BINARY_VIEW_FIXED_BUFFERS + nvariadic_bufs_needed] = NULL; // Ensure array->buffers points to a valid value array->buffers = private_data->buffer_data; return NANOARROW_OK; } static inline 
ArrowErrorCode ArrowArrayAppendBytes(struct ArrowArray* array, struct ArrowBufferView value) { struct ArrowArrayPrivateData* private_data = (struct ArrowArrayPrivateData*)array->private_data; if (private_data->storage_type == NANOARROW_TYPE_STRING_VIEW || private_data->storage_type == NANOARROW_TYPE_BINARY_VIEW) { struct ArrowBuffer* data_buffer = ArrowArrayBuffer(array, 1); union ArrowBinaryView bvt; bvt.inlined.size = (int32_t)value.size_bytes; if (value.size_bytes <= NANOARROW_BINARY_VIEW_INLINE_SIZE) { memcpy(bvt.inlined.data, value.data.as_char, value.size_bytes); memset(bvt.inlined.data + bvt.inlined.size, 0, NANOARROW_BINARY_VIEW_INLINE_SIZE - bvt.inlined.size); } else { int32_t current_n_vbufs = ArrowArrayVariadicBufferCount(array); if (current_n_vbufs == 0 || private_data->variadic_buffers[current_n_vbufs - 1].size_bytes + value.size_bytes > NANOARROW_BINARY_VIEW_BLOCK_SIZE) { const int32_t additional_bufs_needed = 1; NANOARROW_RETURN_NOT_OK( ArrowArrayAddVariadicBuffers(array, additional_bufs_needed)); current_n_vbufs += additional_bufs_needed; } const int32_t buf_index = current_n_vbufs - 1; struct ArrowBuffer* variadic_buf = &private_data->variadic_buffers[buf_index]; memcpy(bvt.ref.prefix, value.data.as_char, NANOARROW_BINARY_VIEW_PREFIX_SIZE); bvt.ref.buffer_index = (int32_t)buf_index; bvt.ref.offset = (int32_t)variadic_buf->size_bytes; NANOARROW_RETURN_NOT_OK( ArrowBufferAppend(variadic_buf, value.data.as_char, value.size_bytes)); } NANOARROW_RETURN_NOT_OK(ArrowBufferAppend(data_buffer, &bvt, sizeof(bvt))); } else { struct ArrowBuffer* offset_buffer = ArrowArrayBuffer(array, 1); struct ArrowBuffer* data_buffer = ArrowArrayBuffer( array, 1 + (private_data->storage_type != NANOARROW_TYPE_FIXED_SIZE_BINARY)); int32_t offset; int64_t large_offset; int64_t fixed_size_bytes = private_data->layout.element_size_bits[1] / 8; switch (private_data->storage_type) { case NANOARROW_TYPE_STRING: case NANOARROW_TYPE_BINARY: offset = 
((int32_t*)offset_buffer->data)[array->length]; if ((((int64_t)offset) + value.size_bytes) > INT32_MAX) { return EOVERFLOW; } offset += (int32_t)value.size_bytes; NANOARROW_RETURN_NOT_OK( ArrowBufferAppend(offset_buffer, &offset, sizeof(int32_t))); NANOARROW_RETURN_NOT_OK( ArrowBufferAppend(data_buffer, value.data.data, value.size_bytes)); break; case NANOARROW_TYPE_LARGE_STRING: case NANOARROW_TYPE_LARGE_BINARY: large_offset = ((int64_t*)offset_buffer->data)[array->length]; large_offset += value.size_bytes; NANOARROW_RETURN_NOT_OK( ArrowBufferAppend(offset_buffer, &large_offset, sizeof(int64_t))); NANOARROW_RETURN_NOT_OK( ArrowBufferAppend(data_buffer, value.data.data, value.size_bytes)); break; case NANOARROW_TYPE_FIXED_SIZE_BINARY: if (value.size_bytes != fixed_size_bytes) { return EINVAL; } NANOARROW_RETURN_NOT_OK( ArrowBufferAppend(data_buffer, value.data.data, value.size_bytes)); break; default: return EINVAL; } } if (private_data->bitmap.buffer.data != NULL) { NANOARROW_RETURN_NOT_OK(ArrowBitmapAppend(ArrowArrayValidityBitmap(array), 1, 1)); } array->length++; return NANOARROW_OK; } static inline ArrowErrorCode ArrowArrayAppendString(struct ArrowArray* array, struct ArrowStringView value) { struct ArrowArrayPrivateData* private_data = (struct ArrowArrayPrivateData*)array->private_data; struct ArrowBufferView buffer_view; buffer_view.data.data = value.data; buffer_view.size_bytes = value.size_bytes; switch (private_data->storage_type) { case NANOARROW_TYPE_STRING: case NANOARROW_TYPE_LARGE_STRING: case NANOARROW_TYPE_STRING_VIEW: case NANOARROW_TYPE_BINARY: case NANOARROW_TYPE_LARGE_BINARY: case NANOARROW_TYPE_BINARY_VIEW: return ArrowArrayAppendBytes(array, buffer_view); default: return EINVAL; } } static inline ArrowErrorCode ArrowArrayAppendInterval(struct ArrowArray* array, const struct ArrowInterval* value) { struct ArrowArrayPrivateData* private_data = (struct ArrowArrayPrivateData*)array->private_data; struct ArrowBuffer* data_buffer = 
ArrowArrayBuffer(array, 1); switch (private_data->storage_type) { case NANOARROW_TYPE_INTERVAL_MONTHS: { if (value->type != NANOARROW_TYPE_INTERVAL_MONTHS) { return EINVAL; } NANOARROW_RETURN_NOT_OK(ArrowBufferAppendInt32(data_buffer, value->months)); break; } case NANOARROW_TYPE_INTERVAL_DAY_TIME: { if (value->type != NANOARROW_TYPE_INTERVAL_DAY_TIME) { return EINVAL; } NANOARROW_RETURN_NOT_OK(ArrowBufferAppendInt32(data_buffer, value->days)); NANOARROW_RETURN_NOT_OK(ArrowBufferAppendInt32(data_buffer, value->ms)); break; } case NANOARROW_TYPE_INTERVAL_MONTH_DAY_NANO: { if (value->type != NANOARROW_TYPE_INTERVAL_MONTH_DAY_NANO) { return EINVAL; } NANOARROW_RETURN_NOT_OK(ArrowBufferAppendInt32(data_buffer, value->months)); NANOARROW_RETURN_NOT_OK(ArrowBufferAppendInt32(data_buffer, value->days)); NANOARROW_RETURN_NOT_OK(ArrowBufferAppendInt64(data_buffer, value->ns)); break; } default: return EINVAL; } if (private_data->bitmap.buffer.data != NULL) { NANOARROW_RETURN_NOT_OK(ArrowBitmapAppend(ArrowArrayValidityBitmap(array), 1, 1)); } array->length++; return NANOARROW_OK; } static inline ArrowErrorCode ArrowArrayAppendDecimal(struct ArrowArray* array, const struct ArrowDecimal* value) { struct ArrowArrayPrivateData* private_data = (struct ArrowArrayPrivateData*)array->private_data; struct ArrowBuffer* data_buffer = ArrowArrayBuffer(array, 1); switch (private_data->storage_type) { case NANOARROW_TYPE_DECIMAL32: if (value->n_words != 0) { return EINVAL; } else { NANOARROW_RETURN_NOT_OK( ArrowBufferAppend(data_buffer, value->words, sizeof(uint32_t))); break; } case NANOARROW_TYPE_DECIMAL64: if (value->n_words != 1) { return EINVAL; } else { NANOARROW_RETURN_NOT_OK( ArrowBufferAppend(data_buffer, value->words, sizeof(uint64_t))); break; } case NANOARROW_TYPE_DECIMAL128: if (value->n_words != 2) { return EINVAL; } else { NANOARROW_RETURN_NOT_OK( ArrowBufferAppend(data_buffer, value->words, 2 * sizeof(uint64_t))); break; } case NANOARROW_TYPE_DECIMAL256: if (value->n_words 
!= 4) { return EINVAL; } else { NANOARROW_RETURN_NOT_OK( ArrowBufferAppend(data_buffer, value->words, 4 * sizeof(uint64_t))); break; } default: return EINVAL; } if (private_data->bitmap.buffer.data != NULL) { NANOARROW_RETURN_NOT_OK(ArrowBitmapAppend(ArrowArrayValidityBitmap(array), 1, 1)); } array->length++; return NANOARROW_OK; } static inline ArrowErrorCode ArrowArrayFinishElement(struct ArrowArray* array) { struct ArrowArrayPrivateData* private_data = (struct ArrowArrayPrivateData*)array->private_data; int64_t child_length; switch (private_data->storage_type) { case NANOARROW_TYPE_LIST: case NANOARROW_TYPE_MAP: child_length = array->children[0]->length; if (child_length > INT32_MAX) { return EOVERFLOW; } NANOARROW_RETURN_NOT_OK( ArrowBufferAppendInt32(ArrowArrayBuffer(array, 1), (int32_t)child_length)); break; case NANOARROW_TYPE_LARGE_LIST: child_length = array->children[0]->length; NANOARROW_RETURN_NOT_OK( ArrowBufferAppendInt64(ArrowArrayBuffer(array, 1), child_length)); break; case NANOARROW_TYPE_FIXED_SIZE_LIST: child_length = array->children[0]->length; if (child_length != ((array->length + 1) * private_data->layout.child_size_elements)) { return EINVAL; } break; case NANOARROW_TYPE_LIST_VIEW: { child_length = array->children[0]->length; if (child_length > INT32_MAX) { return EOVERFLOW; } const int32_t last_valid_offset = (int32_t)private_data->list_view_offset; NANOARROW_RETURN_NOT_OK( ArrowBufferAppendInt32(ArrowArrayBuffer(array, 1), last_valid_offset)); NANOARROW_RETURN_NOT_OK(ArrowBufferAppendInt32( ArrowArrayBuffer(array, 2), (int32_t)child_length - last_valid_offset)); private_data->list_view_offset = child_length; break; } case NANOARROW_TYPE_LARGE_LIST_VIEW: { child_length = array->children[0]->length; const int64_t last_valid_offset = private_data->list_view_offset; NANOARROW_RETURN_NOT_OK( ArrowBufferAppendInt64(ArrowArrayBuffer(array, 1), last_valid_offset)); NANOARROW_RETURN_NOT_OK(ArrowBufferAppendInt64(ArrowArrayBuffer(array, 2), 
child_length - last_valid_offset)); private_data->list_view_offset = child_length; break; } case NANOARROW_TYPE_STRUCT: for (int64_t i = 0; i < array->n_children; i++) { child_length = array->children[i]->length; if (child_length != (array->length + 1)) { return EINVAL; } } break; default: return EINVAL; } if (private_data->bitmap.buffer.data != NULL) { NANOARROW_RETURN_NOT_OK(ArrowBitmapAppend(ArrowArrayValidityBitmap(array), 1, 1)); } array->length++; return NANOARROW_OK; } static inline ArrowErrorCode ArrowArrayFinishUnionElement(struct ArrowArray* array, int8_t type_id) { struct ArrowArrayPrivateData* private_data = (struct ArrowArrayPrivateData*)array->private_data; int64_t child_index = _ArrowArrayUnionChildIndex(array, type_id); if (child_index < 0 || child_index >= array->n_children) { return EINVAL; } switch (private_data->storage_type) { case NANOARROW_TYPE_DENSE_UNION: // Append the target child length to the union offsets buffer _NANOARROW_CHECK_RANGE(array->children[child_index]->length, 0, INT32_MAX); NANOARROW_RETURN_NOT_OK(ArrowBufferAppendInt32( ArrowArrayBuffer(array, 1), (int32_t)array->children[child_index]->length - 1)); break; case NANOARROW_TYPE_SPARSE_UNION: // Append one empty to any non-target column that isn't already the right length // or abort if appending a null will result in a column with invalid length for (int64_t i = 0; i < array->n_children; i++) { if (i == child_index || array->children[i]->length == (array->length + 1)) { continue; } if (array->children[i]->length != array->length) { return EINVAL; } NANOARROW_RETURN_NOT_OK(ArrowArrayAppendEmpty(array->children[i], 1)); } break; default: return EINVAL; } // Write to the type_ids buffer NANOARROW_RETURN_NOT_OK( ArrowBufferAppendInt8(ArrowArrayBuffer(array, 0), (int8_t)type_id)); array->length++; return NANOARROW_OK; } static inline void ArrowArrayViewMove(struct ArrowArrayView* src, struct ArrowArrayView* dst) { memcpy(dst, src, sizeof(struct ArrowArrayView)); 
ArrowArrayViewInitFromType(src, NANOARROW_TYPE_UNINITIALIZED); } static inline int64_t ArrowArrayViewGetNumBuffers(struct ArrowArrayView* array_view) { switch (array_view->storage_type) { case NANOARROW_TYPE_BINARY_VIEW: case NANOARROW_TYPE_STRING_VIEW: return NANOARROW_BINARY_VIEW_FIXED_BUFFERS + array_view->n_variadic_buffers + 1; default: break; } int64_t n_buffers = 0; for (int i = 0; i < NANOARROW_MAX_FIXED_BUFFERS; i++) { if (array_view->layout.buffer_type[i] == NANOARROW_BUFFER_TYPE_NONE) { break; } n_buffers++; } return n_buffers; } static inline struct ArrowBufferView ArrowArrayViewGetBufferView( struct ArrowArrayView* array_view, int64_t i) { switch (array_view->storage_type) { case NANOARROW_TYPE_BINARY_VIEW: case NANOARROW_TYPE_STRING_VIEW: if (i < NANOARROW_BINARY_VIEW_FIXED_BUFFERS) { return array_view->buffer_views[i]; } else if (i >= (array_view->n_variadic_buffers + NANOARROW_BINARY_VIEW_FIXED_BUFFERS)) { struct ArrowBufferView view; view.data.as_int64 = array_view->variadic_buffer_sizes; view.size_bytes = array_view->n_variadic_buffers * sizeof(double); return view; } else { struct ArrowBufferView view; view.data.data = array_view->variadic_buffers[i - NANOARROW_BINARY_VIEW_FIXED_BUFFERS]; view.size_bytes = array_view->variadic_buffer_sizes[i - NANOARROW_BINARY_VIEW_FIXED_BUFFERS]; return view; } default: // We need this check to avoid -Warray-bounds from complaining if (i >= NANOARROW_MAX_FIXED_BUFFERS) { struct ArrowBufferView view; view.data.data = NULL; view.size_bytes = 0; return view; } else { return array_view->buffer_views[i]; } } } enum ArrowBufferType ArrowArrayViewGetBufferType(struct ArrowArrayView* array_view, int64_t i) { switch (array_view->storage_type) { case NANOARROW_TYPE_BINARY_VIEW: case NANOARROW_TYPE_STRING_VIEW: if (i < NANOARROW_BINARY_VIEW_FIXED_BUFFERS) { return array_view->layout.buffer_type[i]; } else if (i == (array_view->n_variadic_buffers + NANOARROW_BINARY_VIEW_FIXED_BUFFERS)) { return 
NANOARROW_BUFFER_TYPE_VARIADIC_SIZE; } else { return NANOARROW_BUFFER_TYPE_VARIADIC_DATA; } default: // We need this check to avoid -Warray-bounds from complaining if (i >= NANOARROW_MAX_FIXED_BUFFERS) { return NANOARROW_BUFFER_TYPE_NONE; } else { return array_view->layout.buffer_type[i]; } } } static inline enum ArrowType ArrowArrayViewGetBufferDataType( struct ArrowArrayView* array_view, int64_t i) { switch (array_view->storage_type) { case NANOARROW_TYPE_BINARY_VIEW: case NANOARROW_TYPE_STRING_VIEW: if (i < NANOARROW_BINARY_VIEW_FIXED_BUFFERS) { return array_view->layout.buffer_data_type[i]; } else if (i >= (array_view->n_variadic_buffers + NANOARROW_BINARY_VIEW_FIXED_BUFFERS)) { return NANOARROW_TYPE_INT64; } else if (array_view->storage_type == NANOARROW_TYPE_BINARY_VIEW) { return NANOARROW_TYPE_BINARY; } else { return NANOARROW_TYPE_STRING; } default: // We need this check to avoid -Warray-bounds from complaining if (i >= NANOARROW_MAX_FIXED_BUFFERS) { return NANOARROW_TYPE_UNINITIALIZED; } else { return array_view->layout.buffer_data_type[i]; } } } static inline int64_t ArrowArrayViewGetBufferElementSizeBits( struct ArrowArrayView* array_view, int64_t i) { switch (array_view->storage_type) { case NANOARROW_TYPE_BINARY_VIEW: case NANOARROW_TYPE_STRING_VIEW: if (i < NANOARROW_BINARY_VIEW_FIXED_BUFFERS) { return array_view->layout.element_size_bits[i]; } else if (i >= (array_view->n_variadic_buffers + NANOARROW_BINARY_VIEW_FIXED_BUFFERS)) { return sizeof(int64_t) * 8; } else { return 0; } default: // We need this check to avoid -Warray-bounds from complaining if (i >= NANOARROW_MAX_FIXED_BUFFERS) { return 0; } else { return array_view->layout.element_size_bits[i]; } } } static inline int8_t ArrowArrayViewIsNull(const struct ArrowArrayView* array_view, int64_t i) { const uint8_t* validity_buffer = array_view->buffer_views[0].data.as_uint8; i += array_view->offset; switch (array_view->storage_type) { case NANOARROW_TYPE_NA: return 0x01; case 
NANOARROW_TYPE_DENSE_UNION: case NANOARROW_TYPE_SPARSE_UNION: // Unions are "never null" in Arrow land return 0x00; default: return validity_buffer != NULL && !ArrowBitGet(validity_buffer, i); } } static inline int64_t ArrowArrayViewComputeNullCount( const struct ArrowArrayView* array_view) { if (array_view->length == 0) { return 0; } switch (array_view->storage_type) { case NANOARROW_TYPE_NA: return array_view->length; case NANOARROW_TYPE_DENSE_UNION: case NANOARROW_TYPE_SPARSE_UNION: // Unions are "never null" in Arrow land return 0; default: break; } const uint8_t* validity_buffer = array_view->buffer_views[0].data.as_uint8; if (validity_buffer == NULL) { return 0; } return array_view->length - ArrowBitCountSet(validity_buffer, array_view->offset, array_view->length); } static inline int8_t ArrowArrayViewUnionTypeId(const struct ArrowArrayView* array_view, int64_t i) { switch (array_view->storage_type) { case NANOARROW_TYPE_DENSE_UNION: case NANOARROW_TYPE_SPARSE_UNION: return array_view->buffer_views[0].data.as_int8[array_view->offset + i]; default: return -1; } } static inline int8_t ArrowArrayViewUnionChildIndex( const struct ArrowArrayView* array_view, int64_t i) { int8_t type_id = ArrowArrayViewUnionTypeId(array_view, i); if (array_view->union_type_id_map == NULL) { return type_id; } else { return array_view->union_type_id_map[type_id]; } } static inline int64_t ArrowArrayViewUnionChildOffset( const struct ArrowArrayView* array_view, int64_t i) { switch (array_view->storage_type) { case NANOARROW_TYPE_DENSE_UNION: return array_view->buffer_views[1].data.as_int32[array_view->offset + i]; case NANOARROW_TYPE_SPARSE_UNION: return array_view->offset + i; default: return -1; } } static inline int64_t ArrowArrayViewListChildOffset( const struct ArrowArrayView* array_view, int64_t i) { switch (array_view->storage_type) { case NANOARROW_TYPE_LIST: case NANOARROW_TYPE_MAP: case NANOARROW_TYPE_LIST_VIEW: return array_view->buffer_views[1].data.as_int32[i]; case 
NANOARROW_TYPE_LARGE_LIST:
    case NANOARROW_TYPE_LARGE_LIST_VIEW:
      return array_view->buffer_views[1].data.as_int64[i];
    default:
      return -1;
  }
}

/* Resolve the bytes of string/binary-view element i: either the bytes inlined
 * in the 16-byte view struct, or a slice of the referenced variadic buffer. */
static struct ArrowBufferView ArrowArrayViewGetBytesFromViewArrayUnsafe(
    const struct ArrowArrayView* array_view, int64_t i) {
  const union ArrowBinaryView* bv = &array_view->buffer_views[1].data.as_binary_view[i];
  struct ArrowBufferView out = {{NULL}, bv->inlined.size};
  if (bv->inlined.size <= NANOARROW_BINARY_VIEW_INLINE_SIZE) {
    out.data.as_uint8 = bv->inlined.data;
    return out;
  }

  out.data.data = array_view->variadic_buffers[bv->ref.buffer_index];
  out.data.as_uint8 += bv->ref.offset;
  return out;
}

/* Element i coerced to int64.  "Unsafe": no null or bounds checking;
 * unsupported storage types return INT64_MAX. */
static inline int64_t ArrowArrayViewGetIntUnsafe(const struct ArrowArrayView* array_view,
                                                 int64_t i) {
  const struct ArrowBufferView* data_view = &array_view->buffer_views[1];
  i += array_view->offset;
  switch (array_view->storage_type) {
    case NANOARROW_TYPE_INT64:
      return data_view->data.as_int64[i];
    case NANOARROW_TYPE_UINT64:
      return data_view->data.as_uint64[i];
    case NANOARROW_TYPE_INTERVAL_MONTHS:
    case NANOARROW_TYPE_INT32:
      return data_view->data.as_int32[i];
    case NANOARROW_TYPE_UINT32:
      return data_view->data.as_uint32[i];
    case NANOARROW_TYPE_INT16:
      return data_view->data.as_int16[i];
    case NANOARROW_TYPE_UINT16:
      return data_view->data.as_uint16[i];
    case NANOARROW_TYPE_INT8:
      return data_view->data.as_int8[i];
    case NANOARROW_TYPE_UINT8:
      return data_view->data.as_uint8[i];
    case NANOARROW_TYPE_DOUBLE:
      return (int64_t)data_view->data.as_double[i];
    case NANOARROW_TYPE_FLOAT:
      return (int64_t)data_view->data.as_float[i];
    case NANOARROW_TYPE_HALF_FLOAT:
      return (int64_t)ArrowHalfFloatToFloat(data_view->data.as_uint16[i]);
    case NANOARROW_TYPE_BOOL:
      return ArrowBitGet(data_view->data.as_uint8, i);
    default:
      return INT64_MAX;
  }
}

/* Element i coerced to uint64; unsupported storage types return UINT64_MAX. */
static inline uint64_t ArrowArrayViewGetUIntUnsafe(
    const struct ArrowArrayView* array_view, int64_t i) {
  i += array_view->offset;
  const struct ArrowBufferView* data_view = &array_view->buffer_views[1];
  switch (array_view->storage_type) {
    case NANOARROW_TYPE_INT64:
      return data_view->data.as_int64[i];
    case NANOARROW_TYPE_UINT64:
      return data_view->data.as_uint64[i];
    case NANOARROW_TYPE_INTERVAL_MONTHS:
    case NANOARROW_TYPE_INT32:
      return data_view->data.as_int32[i];
    case NANOARROW_TYPE_UINT32:
      return data_view->data.as_uint32[i];
    case NANOARROW_TYPE_INT16:
      return data_view->data.as_int16[i];
    case NANOARROW_TYPE_UINT16:
      return data_view->data.as_uint16[i];
    case NANOARROW_TYPE_INT8:
      return data_view->data.as_int8[i];
    case NANOARROW_TYPE_UINT8:
      return data_view->data.as_uint8[i];
    case NANOARROW_TYPE_DOUBLE:
      return (uint64_t)data_view->data.as_double[i];
    case NANOARROW_TYPE_FLOAT:
      return (uint64_t)data_view->data.as_float[i];
    case NANOARROW_TYPE_HALF_FLOAT:
      return (uint64_t)ArrowHalfFloatToFloat(data_view->data.as_uint16[i]);
    case NANOARROW_TYPE_BOOL:
      return ArrowBitGet(data_view->data.as_uint8, i);
    default:
      return UINT64_MAX;
  }
}

/* Element i coerced to double (continues on the next chunk line). */
static inline double ArrowArrayViewGetDoubleUnsafe(
    const struct ArrowArrayView* array_view, int64_t i) {
  i += array_view->offset;
  const struct ArrowBufferView* data_view = &array_view->buffer_views[1];
  switch (array_view->storage_type) {
    case NANOARROW_TYPE_INT64:
      return (double)data_view->data.as_int64[i];
    case NANOARROW_TYPE_UINT64:
      return (double)data_view->data.as_uint64[i];
    case NANOARROW_TYPE_INT32:
      return data_view->data.as_int32[i];
    case NANOARROW_TYPE_UINT32:
      return data_view->data.as_uint32[i];
    case NANOARROW_TYPE_INT16:
      return data_view->data.as_int16[i];
    case NANOARROW_TYPE_UINT16:
      return data_view->data.as_uint16[i];
    case NANOARROW_TYPE_INT8:
      return data_view->data.as_int8[i];
    case NANOARROW_TYPE_UINT8:
      return data_view->data.as_uint8[i];
    case NANOARROW_TYPE_DOUBLE:
      return data_view->data.as_double[i];
    case NANOARROW_TYPE_FLOAT:
      return data_view->data.as_float[i];
    case NANOARROW_TYPE_HALF_FLOAT:
      return ArrowHalfFloatToFloat(data_view->data.as_uint16[i]);
    case NANOARROW_TYPE_BOOL:
      return ArrowBitGet(data_view->data.as_uint8, i);
    default:
return DBL_MAX;
  }
}

/* String/binary element i as a (data, size) string view.  "Unsafe": no null
 * or bounds checking; unsupported storage types yield an empty view. */
static inline struct ArrowStringView ArrowArrayViewGetStringUnsafe(
    const struct ArrowArrayView* array_view, int64_t i) {
  i += array_view->offset;
  const struct ArrowBufferView* offsets_view = &array_view->buffer_views[1];
  const char* data_view = array_view->buffer_views[2].data.as_char;
  struct ArrowStringView view;
  switch (array_view->storage_type) {
    case NANOARROW_TYPE_STRING:
    case NANOARROW_TYPE_BINARY:
      /* 32-bit offsets: size is the difference of adjacent offsets */
      view.data = data_view + offsets_view->data.as_int32[i];
      view.size_bytes =
          (int64_t)offsets_view->data.as_int32[i + 1] - offsets_view->data.as_int32[i];
      break;
    case NANOARROW_TYPE_LARGE_STRING:
    case NANOARROW_TYPE_LARGE_BINARY:
      view.data = data_view + offsets_view->data.as_int64[i];
      view.size_bytes =
          offsets_view->data.as_int64[i + 1] - offsets_view->data.as_int64[i];
      break;
    case NANOARROW_TYPE_FIXED_SIZE_BINARY:
      /* Fixed width: data lives directly in buffer 1 */
      view.size_bytes = array_view->layout.element_size_bits[1] / 8;
      view.data = array_view->buffer_views[1].data.as_char + (i * view.size_bytes);
      break;
    case NANOARROW_TYPE_STRING_VIEW:
    case NANOARROW_TYPE_BINARY_VIEW: {
      struct ArrowBufferView buf_view =
          ArrowArrayViewGetBytesFromViewArrayUnsafe(array_view, i);
      view.data = buf_view.data.as_char;
      view.size_bytes = buf_view.size_bytes;
      break;
    }
    default:
      view.data = NULL;
      view.size_bytes = 0;
      break;
  }
  return view;
}

/* Same as above but returned as a byte-oriented buffer view. */
static inline struct ArrowBufferView ArrowArrayViewGetBytesUnsafe(
    const struct ArrowArrayView* array_view, int64_t i) {
  i += array_view->offset;
  const struct ArrowBufferView* offsets_view = &array_view->buffer_views[1];
  const uint8_t* data_view = array_view->buffer_views[2].data.as_uint8;
  struct ArrowBufferView view;
  switch (array_view->storage_type) {
    case NANOARROW_TYPE_STRING:
    case NANOARROW_TYPE_BINARY:
      view.size_bytes =
          (int64_t)offsets_view->data.as_int32[i + 1] - offsets_view->data.as_int32[i];
      view.data.as_uint8 = data_view + offsets_view->data.as_int32[i];
      break;
    case NANOARROW_TYPE_LARGE_STRING:
    case NANOARROW_TYPE_LARGE_BINARY:
      view.size_bytes =
          offsets_view->data.as_int64[i + 1] - offsets_view->data.as_int64[i];
      view.data.as_uint8 = data_view + offsets_view->data.as_int64[i];
      break;
    case NANOARROW_TYPE_FIXED_SIZE_BINARY:
      view.size_bytes = array_view->layout.element_size_bits[1] / 8;
      view.data.as_uint8 =
          array_view->buffer_views[1].data.as_uint8 + (i * view.size_bytes);
      break;
    case NANOARROW_TYPE_STRING_VIEW:
    case NANOARROW_TYPE_BINARY_VIEW:
      view = ArrowArrayViewGetBytesFromViewArrayUnsafe(array_view, i);
      break;
    default:
      view.data.data = NULL;
      view.size_bytes = 0;
      break;
  }
  return view;
}

/* Copy interval element i into *out, decoding the packed per-type layout
 * (months / day+ms / month+day+nano).  Unknown storage types leave *out as-is. */
static inline void ArrowArrayViewGetIntervalUnsafe(
    const struct ArrowArrayView* array_view, int64_t i, struct ArrowInterval* out) {
  const uint8_t* data_view = array_view->buffer_views[1].data.as_uint8;
  const int64_t offset = array_view->offset;
  const int64_t index = offset + i;
  switch (array_view->storage_type) {
    case NANOARROW_TYPE_INTERVAL_MONTHS: {
      const size_t size = sizeof(int32_t);
      memcpy(&out->months, data_view + index * size, sizeof(int32_t));
      break;
    }
    case NANOARROW_TYPE_INTERVAL_DAY_TIME: {
      const size_t size = sizeof(int32_t) + sizeof(int32_t);
      memcpy(&out->days, data_view + index * size, sizeof(int32_t));
      memcpy(&out->ms, data_view + index * size + 4, sizeof(int32_t));
      break;
    }
    case NANOARROW_TYPE_INTERVAL_MONTH_DAY_NANO: {
      const size_t size = sizeof(int32_t) + sizeof(int32_t) + sizeof(int64_t);
      memcpy(&out->months, data_view + index * size, sizeof(int32_t));
      memcpy(&out->days, data_view + index * size + 4, sizeof(int32_t));
      memcpy(&out->ns, data_view + index * size + 8, sizeof(int64_t));
      break;
    }
    default:
      break;
  }
}

/* Copy decimal element i into *out (continues on the next chunk line). */
static inline void ArrowArrayViewGetDecimalUnsafe(const struct ArrowArrayView* array_view,
                                                  int64_t i, struct ArrowDecimal* out) {
  i += array_view->offset;
  const uint8_t* data_view = array_view->buffer_views[1].data.as_uint8;
  switch (array_view->storage_type) {
    case NANOARROW_TYPE_DECIMAL32:
      ArrowDecimalSetBytes(out, data_view + (i * 4));
      break;
    case NANOARROW_TYPE_DECIMAL64:
ArrowDecimalSetBytes(out, data_view + (i * 8)); break; case NANOARROW_TYPE_DECIMAL128: ArrowDecimalSetBytes(out, data_view + (i * 16)); break; case NANOARROW_TYPE_DECIMAL256: ArrowDecimalSetBytes(out, data_view + (i * 32)); break; default: memset(out->words, 0, sizeof(out->words)); break; } } #ifdef __cplusplus } #endif #endif ================================================ FILE: data/lang/cpp/pool.cpp ================================================ #include #include #include #include #include #include #include #include #include #include #include #include // needed for foreign interface #include #include #include #include #include #include using namespace std; char* g_tmpdir; uint8_t* foreign_call(const char* socket_filename, size_t mid, ...) __attribute__((sentinel)); // AUTO include statements start // <<>> // AUTO include statements end // Proper linking of cppmorloc requires it be included AFTER the custom modules #include "mlc_arrow.hpp" #include "cppmorloc.hpp" #define PROPAGATE_ERROR(errmsg) \ if(errmsg != NULL) { \ char errmsg_buffer[MAX_ERRMSG_SIZE] = { 0 }; \ snprintf(errmsg_buffer, MAX_ERRMSG_SIZE, "Error C++ pool (%s:%d in %s):\n%s" , __FILE__, __LINE__, __func__, errmsg); \ free(errmsg); \ throw std::runtime_error(errmsg_buffer); \ } #define PROPAGATE_FAIL_PACKET(errmsg) \ if(errmsg != NULL){ \ uint8_t* fail_packet_ = make_fail_packet(errmsg); \ free(errmsg); \ return fail_packet_; \ } // AUTO serialization statements start // <<>> // AUTO serialization statements end std::string interweave_strings(const std::vector& first, const std::vector& second) { // Validate sizes - errors here indicate a bug in the morloc compiler if (first.size() != second.size() + 1) { throw std::invalid_argument("First list must have exactly 1 more element than second list"); } // Pre-calculate total size to avoid reallocations size_t total_size = 0; for (const auto& s : first) total_size += s.size(); for (const auto& s : second) total_size += s.size(); std::string result; 
result.reserve(total_size); // Interweave the strings for (size_t i = 0; i < second.size(); ++i) { result += first[i]; result += second[i]; } result += first.back(); // Append the final element from first list return result; } // Thread-local list of SHM pointers allocated by _put_value. // Freed after foreign_call returns (args consumed) or at next dispatch start // (result consumed by caller in the synchronous call that returned it). struct ShmEntry { absptr_t ptr; Schema* schema; }; thread_local std::vector _shm_tracker; static void _flush_shm_tracker() { for (auto& e : _shm_tracker) { char* err = NULL; // Only do recursive sub-freeing if we have a schema and this is // the last reference. NULL schema entries (from foreign_call result // tracking) just decrement the refcount. block_header_t* blk = (block_header_t*)((char*)e.ptr - sizeof(block_header_t)); if (e.schema && blk->reference_count <= 1) { shfree_by_schema(e.ptr, e.schema, &err); if (err) { free(err); err = NULL; } } shfree(e.ptr, &err); if (err) { free(err); } } _shm_tracker.clear(); } // Thread-local schema cache: avoids re-parsing the same schema strings Schema* get_cached_schema(const char* schema_str) { thread_local std::unordered_map cache; auto it = cache.find(schema_str); if (it != cache.end()) return it->second; Schema* schema = parse_schema_cpp(schema_str); cache[schema_str] = schema; return schema; } // Transforms a serialized value into a message ready for the socket template uint8_t* _put_value(const T& value, const std::string& schema_str) { Schema* schema = get_cached_schema(schema_str.c_str()); if constexpr (std::is_same_v) { // Arrow export: move table data into SHM, build packet. // const_cast is safe here: the value is always a temporary from // a manifold call, never a truly const object. 
mlc::ArrowTable& tbl = const_cast(value); // NOTE(review): const_cast lost its <mlc::ArrowTable&> argument
        relptr_t relptr = tbl.move_to_shm();
        uint8_t* packet = make_arrow_data_packet(relptr, schema);
        if (!packet) {
            throw std::runtime_error("Failed to create arrow data packet");
        }
        // Track the SHM block (NULL schema: refcount-only cleanup) for the
        // next dispatch flush; rel2abs errors are discarded as best-effort.
        char* err = nullptr;
        void* shm_ptr = rel2abs(relptr, &err);
        if (err) { free(err); }
        if (shm_ptr) { _shm_tracker.push_back({(absptr_t)shm_ptr, nullptr}); }
        return packet;
    } else {
        // Arrow dispatch: if schema hint is "arrow", the C++ type must be mlc::ArrowTable
        if (schema->hint && strcmp(schema->hint, "arrow") == 0) {
            throw std::runtime_error("Arrow schema but C++ type is not mlc::ArrowTable");
        }
        void* voidstar = nullptr;
        try {
            voidstar = toAnything(schema, value);
            relptr_t relptr = abs2rel_cpp(voidstar);
            char* errmsg = nullptr;
            uint8_t* packet = make_data_packet_auto(voidstar, relptr, schema, &errmsg);
            if (errmsg) {
                shfree_cpp(voidstar);
                PROPAGATE_ERROR(errmsg);
            }
            const morloc_packet_header_t* hdr = (const morloc_packet_header_t*)packet;
            if (hdr->command.data.source == PACKET_SOURCE_RPTR) {
                // SHM referenced by packet -- track for deferred cleanup
                _shm_tracker.push_back({(absptr_t)voidstar, schema});
            } else {
                // Data inlined in packet -- free SHM immediately
                char* free_err = NULL;
                shfree_by_schema((absptr_t)voidstar, schema, &free_err);
                if (free_err) { free(free_err); free_err = NULL; }
                shfree((absptr_t)voidstar, &free_err);
                if (free_err) { free(free_err); }
            }
            return packet;
        } catch (...) {
            // Any conversion/packing failure: release the SHM block, rethrow.
            if (voidstar) shfree_cpp(voidstar);
            throw;
        }
    }
}

// Use a key to retrieve a value
// NOTE(review): `template` lost its parameter list (presumably <typename T>).
template T _get_value(const uint8_t* packet, const std::string& schema_str){
    const morloc_packet_header_t* header = (const morloc_packet_header_t*)packet;
    uint8_t source = header->command.data.source;
    uint8_t format = header->command.data.format;

    // NOTE(review): is_same_v lost its arguments (presumably <T, mlc::ArrowTable>).
    if constexpr (std::is_same_v) {
        // Arrow import: packet -> arrow_from_shm -> ArrowTable
        Schema* schema = get_cached_schema(schema_str.c_str());
        char* errmsg = nullptr;
        uint8_t* raw = get_morloc_data_packet_value(packet, schema, &errmsg);
        if (errmsg) {
            PROPAGATE_ERROR(errmsg);
        }
        const arrow_shm_header_t* hdr = (const arrow_shm_header_t*)raw;
        struct ArrowSchema as;
        struct ArrowArray aa;
        char* aerr = nullptr;
        arrow_from_shm(hdr, &as, &aa, &aerr);
        if (aerr) {
            PROPAGATE_ERROR(aerr);
        }
        // Keep the SHM block alive past the owner's flush (refcount-only entry).
        char* ierr = nullptr;
        shincref((absptr_t)raw, &ierr);
        if (ierr) { free(ierr); }
        _shm_tracker.push_back({(absptr_t)raw, nullptr});
        return mlc::ArrowTable(std::move(as), std::move(aa));
    } else {
        if (format == PACKET_FORMAT_ARROW) {
            throw std::runtime_error("Arrow data but C++ type is not mlc::ArrowTable");
        }
        Schema* schema = get_cached_schema(schema_str.c_str());

        // Fast path: inline voidstar -- read directly from packet, no SHM needed
        if (source == PACKET_SOURCE_MESG && format == PACKET_FORMAT_VOIDSTAR) {
            const uint8_t* payload = packet + sizeof(morloc_packet_header_t) + header->offset;
            T* dummy = nullptr;
            return fromAnything(schema, (const void*)payload, dummy, (const void*)payload);
        }

        // SHM paths (RPTR or MESG+MSGPACK): existing logic
        bool is_rptr = (source == PACKET_SOURCE_RPTR);
        char* errmsg = NULL;
        uint8_t* voidstar = get_morloc_data_packet_value(packet, schema, &errmsg);
        if(errmsg != NULL) { PROPAGATE_ERROR(errmsg) }

        // For RPTR data, increment refcount so the owner's tracker flush
        // won't destroy data we may still need (e.g. forwarded packets).
if (is_rptr) {
            char* incref_err = NULL;
            shincref((absptr_t)voidstar, &incref_err);
            if (incref_err) { free(incref_err); }
            _shm_tracker.push_back({(absptr_t)voidstar, schema});
        }

        T* dummy = nullptr;
        return fromAnything(schema, (void*)voidstar, dummy);
    }
}

// Hash a value, returning a 16-char hex string
// NOTE(review): all `template` heads below lost their parameter lists
// (presumably <typename T>) in extraction.
template std::string _mlc_hash(const T& value, const std::string& schema_str) {
    Schema* schema = get_cached_schema(schema_str.c_str());
    void* voidstar = toAnything(schema, value);
    char* errmsg = NULL;
    char* hex = mlc_hash(voidstar, schema, &errmsg);
    shfree_cpp(voidstar);
    if (errmsg != NULL) { PROPAGATE_ERROR(errmsg) }
    std::string result(hex);
    free(hex);
    return result;
}

// Save a value to file in msgpack format
template void _mlc_save(const T& value, const std::string& schema_str, const std::string& path) {
    Schema* schema = get_cached_schema(schema_str.c_str());
    void* voidstar = toAnything(schema, value);
    char* errmsg = NULL;
    mlc_save(voidstar, schema, path.c_str(), &errmsg);
    shfree_cpp(voidstar);
    if (errmsg != NULL) { PROPAGATE_ERROR(errmsg) }
}

// Save a value to file in flat voidstar binary format
template void _mlc_save_voidstar(const T& value, const std::string& schema_str, const std::string& path) {
    Schema* schema = get_cached_schema(schema_str.c_str());
    void* voidstar = toAnything(schema, value);
    char* errmsg = NULL;
    mlc_save_voidstar(voidstar, schema, path.c_str(), &errmsg);
    shfree_cpp(voidstar);
    if (errmsg != NULL) { PROPAGATE_ERROR(errmsg) }
}

// Save a value to file in JSON format
template void _mlc_save_json(const T& value, const std::string& schema_str, const std::string& path) {
    Schema* schema = get_cached_schema(schema_str.c_str());
    void* voidstar = toAnything(schema, value);
    char* errmsg = NULL;
    mlc_save_json(voidstar, schema, path.c_str(), &errmsg);
    shfree_cpp(voidstar);
    if (errmsg != NULL) { PROPAGATE_ERROR(errmsg) }
}

// Serialize a value to a JSON string
template std::string _mlc_show(const T& value, const std::string& schema_str) {
    Schema* schema = get_cached_schema(schema_str.c_str());
    void* voidstar = toAnything(schema, value);
    char* errmsg = NULL;
    char* json = mlc_show(voidstar, schema, &errmsg);
    shfree_cpp(voidstar);
    if (errmsg != NULL) { PROPAGATE_ERROR(errmsg) }
    std::string result(json);
    free(json);
    return result;
}

// Deserialize a JSON string to a typed value
// Returns std::nullopt on parse failure
// NOTE(review): std::optional lost its argument (presumably <T>).
template std::optional _mlc_read(const std::string& schema_str, const std::string& json_str) {
    Schema* schema = get_cached_schema(schema_str.c_str());
    char* errmsg = NULL;
    void* voidstar = mlc_read(json_str.c_str(), schema, &errmsg);
    if (errmsg != NULL) { PROPAGATE_ERROR(errmsg) }
    if (voidstar == NULL) {
        return std::nullopt;
    }
    T* dummy = nullptr;
    T result = fromAnything(schema, voidstar, dummy);
    shfree_cpp(voidstar);
    return result;
}

// Load a value from file, auto-detecting format
// Returns std::nullopt if file does not exist
template std::optional _mlc_load(const std::string& schema_str, const std::string& path) {
    Schema* schema = get_cached_schema(schema_str.c_str());
    char* errmsg = NULL;
    void* voidstar = mlc_load(path.c_str(), schema, &errmsg);
    if (errmsg != NULL) { PROPAGATE_ERROR(errmsg) }
    if (voidstar == NULL) {
        return std::nullopt;
    }
    T* dummy = nullptr;
    T result = fromAnything(schema, voidstar, dummy);
    shfree_cpp(voidstar);
    return result;
}

// Synchronous cross-language call (body continues on the next chunk line).
uint8_t* foreign_call(const char* socket_filename, size_t mid, ...)
{
    char* errmsg = NULL;
    va_list args;
    size_t nargs = 0;
    char socket_path[128];
    snprintf(socket_path, sizeof(socket_path), "%s/%s", g_tmpdir, socket_filename);

    // Count arguments (must be NULL-terminated)
    va_start(args, mid);
    while (va_arg(args, uint8_t*) != NULL) nargs++;
    va_end(args);

    // Allocate and populate args array
    const uint8_t** args_array = (const uint8_t**)malloc((nargs + 1) * sizeof(uint8_t*));
    if (!args_array) throw std::runtime_error("malloc failed in foreign_call");

    va_start(args, mid);
    for (size_t i = 0; i < nargs; i++) {
        args_array[i] = va_arg(args, uint8_t*);
    }
    args_array[nargs] = NULL; // Sentinel
    va_end(args);

    // Original logic with variadic args converted to array
    uint8_t* packet = make_morloc_local_call_packet((uint32_t)mid, args_array, nargs, &errmsg);
    if (errmsg != NULL) {
        free(args_array);
        PROPAGATE_ERROR(errmsg)
    }

    // Mark the pool busy for the duration of the blocking socket round-trip.
    pool_mark_busy();
    uint8_t* result = send_and_receive_over_socket(socket_path, packet, &errmsg);
    pool_mark_idle();
    free(packet);
    if (errmsg != NULL) {
        free(args_array);
        PROPAGATE_ERROR(errmsg)
    }

    // Incref the result's SHM so the callee's tracker flush won't destroy
    // data we may still need (e.g. forwarded result packets).
    {
        const morloc_packet_header_t* res_header = (const morloc_packet_header_t*)result;
        if (res_header->command.data.source == PACKET_SOURCE_RPTR) {
            size_t relptr = *(size_t*)(result + res_header->offset + sizeof(morloc_packet_header_t));
            char* resolve_err = NULL;
            void* res_voidstar = rel2abs(relptr, &resolve_err);
            if (resolve_err) { free(resolve_err); resolve_err = NULL; }
            if (res_voidstar) {
                char* incref_err = NULL;
                shincref((absptr_t)res_voidstar, &incref_err);
                if (incref_err) { free(incref_err); }
                _shm_tracker.push_back({(absptr_t)res_voidstar, nullptr});
            }
        }
    }

    free(args_array);
    return result;
}

// AUTO signatures statements start
// <<>>
// AUTO signatures statements end

// AUTO manifolds statements start
// <<>>
// AUTO manifolds statements end

// AUTO dispatch start
// <<>>
// AUTO dispatch end

// Wrappers to adapt compiler-generated dispatch functions to pool_dispatch_fn_t.
// These catch C++ exceptions so the C pool_main never sees them.
static uint8_t* cpp_local_dispatch(uint32_t mid, const uint8_t** args, size_t nargs, void* ctx) {
    (void)nargs;
    (void)ctx;
    // Free SHM from previous dispatch (result packet consumed by caller)
    _flush_shm_tracker();
    try {
        return local_dispatch(mid, args);
    } catch (const std::exception& e) {
        return make_fail_packet(e.what());
    } catch (...) {
        return make_fail_packet("An unknown error occurred");
    }
}

static uint8_t* cpp_remote_dispatch(uint32_t mid, const uint8_t** args, size_t nargs, void* ctx) {
    (void)nargs;
    (void)ctx;
    try {
        return remote_dispatch(mid, args);
    } catch (const std::exception& e) {
        return make_fail_packet(e.what());
    } catch (...) {
        return make_fail_packet("An unknown error occurred");
    }
}

// Pool entry point: health check, argument parsing, then hand off to pool_main.
int main(int argc, char* argv[]) {
    // Line-buffer stderr so diagnostic output is not lost on pool shutdown.
    // stdout is left fully buffered for performance (genome-scale piping)
    // and flushed after each job by pool.c.
    setvbuf(stderr, NULL, _IOLBF, 0);

    // Health check: confirm binary links and print version
    if (argc == 2 && std::string(argv[1]) == "--health") {
        std::cout << "{\"status\":\"ok\",\"version\":\"__MORLOC_VERSION__\"}" << std::endl;
        return 0;
    }

    // NOTE(review): the usage string below lost its <...> placeholders in extraction.
    if (argc != 4) {
        std::cerr << "Usage: " << argv[0] << " \n";
        return 1;
    }

    g_tmpdir = strdup(argv[2]);

    pool_config_t config = {};
    config.local_dispatch = cpp_local_dispatch;
    config.remote_dispatch = cpp_remote_dispatch;
    config.dispatch_ctx = NULL;
    config.concurrency = POOL_THREADS;
    config.initial_workers = 1;
    config.dynamic_scaling = true;

    int result = pool_main(argc, argv, &config);
    free(g_tmpdir);
    return result;
}
================================================
FILE: data/lang/julia/MorlocRuntime.jl
================================================
"""
MorlocRuntime

Julia runtime module for morloc. Provides IPC (daemon lifecycle, packet I/O),
msgpack-based serialization, and foreign call support.

All heavy lifting is done by libmorloc via the thin C bridge (libjuliamorloc.so).
Julia handles only the msgpack <-> native type conversion using MsgPack.jl.
"""
module MorlocRuntime

using MsgPack

# Path to the bridge shared library (set during morloc init)
const LIB_PATH = Ref{String}("")

# Locate libjuliamorloc.so at module load; populates LIB_PATH or errors.
function __init__()
    # Look for libjuliamorloc.so relative to this file, or in standard locations
    candidates = [
        joinpath(dirname(@__FILE__), "libjuliamorloc.so"),
        joinpath(dirname(@__FILE__), "..", "lib", "libjuliamorloc.so"),
    ]
    # Also check the morloc home lib directory
    morloc_home = get(ENV, "MORLOC_HOME", joinpath(homedir(), ".local", "share", "morloc"))
    push!(candidates, joinpath(morloc_home, "lib", "libjuliamorloc.so"))
    for path in candidates
        if isfile(path)
            LIB_PATH[] = path
            return
        end
    end
    error("Cannot find libjuliamorloc.so. 
Run `morloc init` first.")
end

# Accessor for the bridge library path resolved by __init__().
lib() = LIB_PATH[]

# -- Error handling --

# Raise a Julia error if the C bridge recorded an error message.
function check_error(context::String)
    msg = unsafe_string(ccall((:jlmorloc_last_error, lib()), Cstring, ()))
    if !isempty(msg)
        error("$context: $msg")
    end
end

# -- Daemon lifecycle --

function start_daemon(socket_path::String, tmpdir::String, shm_basename::String, shm_size::Integer)
    ptr = ccall((:jlmorloc_start_daemon, lib()), Ptr{Nothing},
        (Cstring, Cstring, Cstring, Csize_t),
        socket_path, tmpdir, shm_basename, UInt(shm_size))
    ptr == C_NULL && check_error("start_daemon")
    return ptr
end

function close_daemon(daemon::Ptr{Nothing})
    ccall((:jlmorloc_close_daemon, lib()), Nothing, (Ptr{Nothing},), daemon)
end

# Block until a client connects; returns the client socket fd.
function wait_for_client(daemon::Ptr{Nothing})
    fd = ccall((:jlmorloc_wait_for_client, lib()), Cint, (Ptr{Nothing},), daemon)
    fd < 0 && check_error("wait_for_client")
    return fd
end

# -- Packet I/O --

function stream_from_client(client_fd)
    out_size = Ref{Csize_t}(0)
    ptr = ccall((:jlmorloc_stream_from_client, lib()), Ptr{UInt8},
        (Cint, Ref{Csize_t}), Int32(client_fd), out_size)
    ptr == C_NULL && check_error("stream_from_client")
    return ptr # opaque packet pointer
end

function send_packet_to_foreign_server(client_fd, packet::Ptr{UInt8})
    rc = ccall((:jlmorloc_send_packet, lib()), Cint,
        (Cint, Ptr{UInt8}), Int32(client_fd), packet)
    rc != 0 && check_error("send_packet")
end

function close_socket(fd)
    ccall((:jlmorloc_close_socket, lib()), Nothing, (Cint,), Int32(fd))
end

# -- Packet classification --

function is_ping(packet::Ptr{UInt8})
    ccall((:jlmorloc_is_ping, lib()), Cint, (Ptr{UInt8},), packet) != 0
end

function is_local_call(packet::Ptr{UInt8})
    ccall((:jlmorloc_is_local_call, lib()), Cint, (Ptr{UInt8},), packet) != 0
end

function is_remote_call(packet::Ptr{UInt8})
    ccall((:jlmorloc_is_remote_call, lib()), Cint, (Ptr{UInt8},), packet) != 0
end

# Build the pong response packet for a ping.
function pong(packet::Ptr{UInt8})
    result = ccall((:jlmorloc_pong, lib()), Ptr{UInt8}, (Ptr{UInt8},), packet)
    result == C_NULL && check_error("pong")
    return result
end

# -- Call packet parsing --

"""
    read_morloc_call_packet(packet) -> (mid, args)

Parse a call packet into a manifold index and a vector of argument packets.
"""
function read_morloc_call_packet(packet::Ptr{UInt8})
    out_mid = Ref{UInt32}(0)
    out_nargs = Ref{Csize_t}(0)
    call_ptr = ccall((:jlmorloc_read_call, lib()), Ptr{Nothing},
        (Ptr{UInt8}, Ref{UInt32}, Ref{Csize_t}),
        packet, out_mid, out_nargs)
    call_ptr == C_NULL && check_error("read_call")
    mid = Int(out_mid[])
    nargs = Int(out_nargs[])
    args = Vector{Ptr{UInt8}}(undef, nargs)
    for i in 1:nargs
        # C side is zero-indexed, hence i - 1
        args[i] = ccall((:jlmorloc_call_arg, lib()), Ptr{UInt8},
            (Ptr{Nothing}, Csize_t), call_ptr, UInt(i - 1))
    end
    ccall((:jlmorloc_free_call, lib()), Nothing, (Ptr{Nothing},), call_ptr)
    return (mid, args)
end

# -- Msgpack bridge: serialize/deserialize --

"""
Strip a leading angle-bracket hint prefix (`<...>`) from a schema string,
returning the bare schema (e.g. an `"i4"` payload).
"""
function strip_schema_prefix(schema_str::String)
    if !isempty(schema_str) && schema_str[1] == '<'
        i = findfirst('>', schema_str)
        if i !== nothing
            return schema_str[i+1:end]
        end
    end
    return schema_str
end

"""
    put_value(value, schema_str) -> Ptr{UInt8}

Serialize a Julia value to a morloc data packet via msgpack.
"""
function put_value(value, schema_str::String)
    schema = strip_schema_prefix(schema_str)
    mpk = MsgPack.pack(to_msgpack(value, schema))
    pkt = ccall((:jlmorloc_pack, lib()), Ptr{UInt8},
        (Ptr{UInt8}, Csize_t, Cstring),
        mpk, length(mpk), schema)
    pkt == C_NULL && check_error("pack")
    return pkt
end

"""
    get_value(packet, schema_str) -> Julia value

Deserialize a morloc data packet to a Julia value via msgpack.
"""
function get_value(packet::Ptr{UInt8}, schema_str::String)
    schema = strip_schema_prefix(schema_str)
    out_size = Ref{Csize_t}(0)
    mpk_ptr = ccall((:jlmorloc_unpack, lib()), Ptr{UInt8},
                    (Ptr{UInt8}, Cstring, Ref{Csize_t}), packet, schema, out_size)
    mpk_ptr == C_NULL && check_error("unpack")
    # own=true: Julia's GC takes responsibility for freeing the C buffer.
    mpk_bytes = unsafe_wrap(Array, mpk_ptr, out_size[]; own=true)
    raw = MsgPack.unpack(mpk_bytes)
    return from_msgpack(raw, schema)
end

# -- Error packet --

function make_fail_packet(msg::String)
    ccall((:jlmorloc_make_fail_packet, lib()), Ptr{UInt8}, (Cstring,), msg)
end

# -- Foreign call --

"""
    foreign_call(tmpdir, socket_name, mid, args) -> Ptr{UInt8}

Call another pool (cross-language IPC). args is a vector of packet pointers.
"""
function foreign_call(tmpdir::String, socket_name::String, mid::Integer, args::Vector{Ptr{UInt8}})
    nargs = length(args)
    result = ccall((:jlmorloc_foreign_call, lib()), Ptr{UInt8},
                   (Cstring, Cstring, UInt32, Ptr{Ptr{UInt8}}, Csize_t),
                   tmpdir, socket_name, UInt32(mid), args, UInt(nargs))
    result == C_NULL && check_error("foreign_call")
    return result
end

# -- Type conversion helpers --
# Schema string format:
# "b" = bool, "i4" = int32, "i8" = int64, "f8" = float64, "s" = string
# "ai4" = array of int32, "t(i4f8s)" = tuple
# "m{name:s,age:i4}" = record

"""
Convert a Julia value to a msgpack-friendly representation based on schema.

MsgPack.jl handles most types natively, but we need to ensure correct types
for the schema (e.g., Int32 vs Int64).
"""
function to_msgpack(value, schema::String)
    if startswith(schema, "a")
        # Array: the rest of the schema describes the element type.
        elem_schema = schema[2:end]
        return [to_msgpack(v, elem_schema) for v in value]
    elseif startswith(schema, "t(")
        # Tuple: element schemas are concatenated inside the parentheses.
        inner = schema[3:end-1]
        schemas = split_tuple_schema(inner)
        return [to_msgpack(value[i], schemas[i]) for i in 1:length(schemas)]
    elseif startswith(schema, "m{")
        # Record: comma-separated name:schema fields inside the braces.
        inner = schema[3:end-1]
        fields = split_record_schema(inner)
        return Dict(k => to_msgpack(value[k], s) for (k, s) in fields)
    else
        return to_msgpack_scalar(value, schema)
    end
end

# Coerce a scalar to the exact width/type the schema requires so msgpack
# encodes it consistently across languages.
function to_msgpack_scalar(value, schema::String)
    if schema == "b"
        return Bool(value)
    elseif schema == "i4"
        return Int32(value)
    elseif schema == "i8"
        return Int64(value)
    elseif schema == "u4"
        return UInt32(value)
    elseif schema == "u8"
        return UInt64(value)
    elseif schema == "f4"
        return Float32(value)
    elseif schema == "f8"
        return Float64(value)
    elseif schema == "s"
        return String(value)
    elseif schema == "u"
        # Unit type serializes as nil.
        return nothing
    else
        # Unknown scalar schema: pass the value through unchanged.
        return value
    end
end

"""
Convert a raw msgpack value to a Julia type based on schema.
"""
function from_msgpack(raw, schema::String)
    if startswith(schema, "a")
        elem_schema = schema[2:end]
        return [from_msgpack(v, elem_schema) for v in raw]
    elseif startswith(schema, "t(")
        inner = schema[3:end-1]
        schemas = split_tuple_schema(inner)
        return Tuple(from_msgpack(raw[i], schemas[i]) for i in 1:length(schemas))
    elseif startswith(schema, "m{")
        inner = schema[3:end-1]
        fields = split_record_schema(inner)
        return Dict(k => from_msgpack(raw[k], s) for (k, s) in fields)
    else
        return from_msgpack_scalar(raw, schema)
    end
end

# Inverse of to_msgpack_scalar: coerce a decoded msgpack scalar to the
# Julia type named by the schema.
function from_msgpack_scalar(raw, schema::String)
    if schema == "b"
        return Bool(raw)
    elseif schema == "i4"
        return Int32(raw)
    elseif schema == "i8"
        return Int64(raw)
    elseif schema == "u4"
        return UInt32(raw)
    elseif schema == "u8"
        return UInt64(raw)
    elseif schema == "f4"
        return Float32(raw)
    elseif schema == "f8"
        return Float64(raw)
    elseif schema == "s"
        return String(raw)
    elseif schema == "u"
        return nothing
    else
        return raw
    end
end

# -- Schema parsing helpers --

# Split concatenated tuple element schemas, e.g. "i4f8s" -> ["i4","f8","s"].
function split_tuple_schema(inner::String)
    schemas = String[]
    i = 1
    while i <= length(inner)
        s, i = parse_one_schema(inner, i)
        push!(schemas, s)
    end
    return schemas
end

# Split record fields "name:schema,name:schema" into name => schema pairs.
function split_record_schema(inner::String)
    fields = Pair{String,String}[]
    i = 1
    while i <= length(inner)
        # parse field name
        colon = findnext(':', inner, i)
        name = inner[i:colon-1]
        i = colon + 1
        # parse field schema
        s, i = parse_one_schema(inner, i)
        push!(fields, name => s)
        if i <= length(inner) && inner[i] == ','
            i += 1
        end
    end
    return fields
end

# Parse one schema term starting at index i; returns (schema, next_index).
function parse_one_schema(s::String, i::Int)
    if s[i] == 'a'
        inner, next_i = parse_one_schema(s, i + 1)
        return "a" * inner, next_i
    elseif s[i] == 't'
        # find matching ')'
        depth = 0
        j = i + 1
        while j <= length(s)
            if s[j] == '('; depth += 1; end
            if s[j] == ')'; depth -= 1; if depth == 0; break; end; end
            j += 1
        end
        return s[i:j], j + 1
    elseif s[i] == 'm'
        # find matching '}' (braces may nest for nested records)
        depth = 0
        j = i + 1
        while j <= length(s)
            if s[j] == '{'; depth += 1; end
            if s[j] == '}'; depth -= 1; if depth == 0; break; end; end
            j += 1
        end
        return s[i:j], j + 1
    elseif s[i] in ('i', 'u', 'f')
        # numeric: i4, i8, u4, u8, f4, f8
        return s[i:i+1], i + 2
    elseif s[i] == 's'
        return "s", i + 1
    elseif s[i] == 'b'
        return "b", i + 1
    else
        error("Unknown schema character: $(s[i]) at position $i in '$s'")
    end
end

end # module

================================================
FILE: data/lang/julia/init.sh
================================================
#!/bin/bash
# Install the Julia language support files into MORLOC_HOME and build the
# C bridge library used by the Julia runtime via ccall.
set -e

MORLOC_HOME="$1"
BUILD_DIR="$2"
SANITIZE_FLAGS="$3"

INCLUDE_DIR="$MORLOC_HOME/include"
LIB_DIR="$MORLOC_HOME/lib"
LANG_DIR="$MORLOC_HOME/lang/julia"

mkdir -p "$LANG_DIR"

# Install language descriptor and runtime files
cp "$BUILD_DIR/lang.yaml" "$LANG_DIR/"
cp "$BUILD_DIR/pool.jl" "$LANG_DIR/"
cp "$BUILD_DIR/MorlocRuntime.jl" "$LANG_DIR/"

# Compile juliabridge.c -> libjuliamorloc.so
gcc -shared -fPIC -O2 $SANITIZE_FLAGS -I"$INCLUDE_DIR" -o "$LIB_DIR/libjuliamorloc.so" \
    "$BUILD_DIR/juliabridge.c" -L"$LIB_DIR" -Wl,-rpath,"$LIB_DIR" -lmorloc -lpthread

================================================
FILE: data/lang/julia/juliabridge.c
================================================
/* juliabridge.c -- Thin C bridge between Julia and libmorloc.
 *
 * Compiled to libjuliamorloc.so, called from Julia via ccall.
 * Wraps libmorloc functions that use opaque structs (language_daemon_t,
 * morloc_call_t, Schema) or the ERRMSG pattern into simple pointer/int
 * interfaces that Julia's FFI can handle directly.
 */
#include "morloc.h"
/* NOTE(review): the system header names below were lost in extraction
 * (angle-bracketed text stripped) -- restore from the repository. */
#include
#include
#include

/* Thread-local error message buffer */
static __thread char jl_errbuf[4096];
static __thread char* jl_errmsg = NULL;

static void clear_err(void) { jl_errmsg = NULL; jl_errbuf[0] = '\0'; }

/* Get the last error message (returns "" if none). */
const char* jlmorloc_last_error(void) { return jl_errmsg ?
jl_errmsg : ""; }

/* -- Daemon lifecycle -- */

void* jlmorloc_start_daemon(const char* socket_path, const char* tmpdir,
                            const char* shm_basename, size_t shm_size) {
    clear_err();
    language_daemon_t* d = start_daemon(socket_path, tmpdir, shm_basename, shm_size, &jl_errmsg);
    if (!d && jl_errmsg) {
        /* Copy the error into the stable thread-local buffer so the pointer
         * handed to Julia stays valid. */
        snprintf(jl_errbuf, sizeof(jl_errbuf), "%s", jl_errmsg);
        jl_errmsg = jl_errbuf;
    }
    return (void*)d;
}

void jlmorloc_close_daemon(void* daemon) {
    language_daemon_t* d = (language_daemon_t*)daemon;
    close_daemon(&d);
}

int jlmorloc_wait_for_client(void* daemon) {
    clear_err();
    return wait_for_client((language_daemon_t*)daemon, &jl_errmsg);
}

/* -- Packet I/O -- */

/* Returns a pointer to the packet bytes. Caller must NOT free this
 * directly -- it lives in shared memory or was allocated by libmorloc. */
uint8_t* jlmorloc_stream_from_client(int client_fd, size_t* out_size) {
    clear_err();
    uint8_t* pkt = stream_from_client(client_fd, &jl_errmsg);
    if (pkt && out_size) {
        /* Packet size is in the first 4 bytes (little-endian uint32) */
        uint32_t sz;
        memcpy(&sz, pkt, sizeof(sz));
        *out_size = (size_t)sz;
    }
    return pkt;
}

/* Returns 0 on success, -1 on failure (zero bytes sent). */
int jlmorloc_send_packet(int client_fd, uint8_t* packet) {
    clear_err();
    size_t sent = send_packet_to_foreign_server(client_fd, packet, &jl_errmsg);
    return sent > 0 ? 0 : -1;
}

void jlmorloc_close_socket(int fd) { close_socket(fd); }

/* -- Packet classification -- */

int jlmorloc_is_ping(const uint8_t* packet) {
    clear_err();
    return packet_is_ping(packet, &jl_errmsg) ? 1 : 0;
}

int jlmorloc_is_local_call(const uint8_t* packet) {
    clear_err();
    return packet_is_local_call(packet, &jl_errmsg) ? 1 : 0;
}

int jlmorloc_is_remote_call(const uint8_t* packet) {
    clear_err();
    return packet_is_remote_call(packet, &jl_errmsg) ? 1 : 0;
}

uint8_t* jlmorloc_pong(const uint8_t* packet) {
    clear_err();
    return return_ping(packet, &jl_errmsg);
}

/* -- Call packet parsing -- */

/* Parse a call packet.
Returns the manifold index via out_mid,
 * the number of arguments via out_nargs, and a pointer to the
 * morloc_call_t (which the caller must free via jlmorloc_free_call). */
void* jlmorloc_read_call(const uint8_t* packet, uint32_t* out_mid, size_t* out_nargs) {
    clear_err();
    morloc_call_t* call = read_morloc_call_packet(packet, &jl_errmsg);
    if (!call) return NULL;
    *out_mid = call->midx;
    *out_nargs = call->nargs;
    return (void*)call;
}

/* Get the i-th argument packet from a parsed call. */
uint8_t* jlmorloc_call_arg(void* call_ptr, size_t i) {
    morloc_call_t* call = (morloc_call_t*)call_ptr;
    if (i >= call->nargs) return NULL;
    return call->args[i];
}

void jlmorloc_free_call(void* call_ptr) {
    if (call_ptr) free_morloc_call((morloc_call_t*)call_ptr);
}

/* -- Msgpack bridge -- */

/* Convert msgpack bytes + schema string -> morloc data packet.
 * The schema_str is a compact type descriptor like "i4", "ai4", "m{x:f8}". */
uint8_t* jlmorloc_pack(const char* mpk, size_t mpk_size, const char* schema_str) {
    clear_err();
    Schema* schema = parse_schema(schema_str, &jl_errmsg);
    if (!schema) return NULL;
    uint8_t* pkt = make_data_packet_from_mpk(mpk, mpk_size, schema);
    free_schema(schema);
    return pkt;
}

/* Convert a morloc data packet -> msgpack bytes.
 * Returns a malloc'd buffer; caller must free it.
 */
char* jlmorloc_unpack(const uint8_t* packet, const char* schema_str, size_t* out_size) {
    clear_err();
    Schema* schema = parse_schema(schema_str, &jl_errmsg);
    if (!schema) return NULL;
    char* mpk = NULL;
    size_t mpk_size = 0;
    int ok = get_data_packet_as_mpk(packet, schema, &mpk, &mpk_size, &jl_errmsg);
    free_schema(schema);
    if (!ok) return NULL;
    *out_size = mpk_size;
    return mpk;
}

/* -- Error packet -- */

uint8_t* jlmorloc_make_fail_packet(const char* msg) {
    return make_fail_packet(msg);
}

/* -- Foreign call (cross-pool IPC) -- */

uint8_t* jlmorloc_foreign_call(const char* tmpdir, const char* socket_name,
                               uint32_t mid, uint8_t** arg_packets, size_t nargs) {
    clear_err();
    /* Build the call packet */
    uint8_t* call_pkt = make_morloc_local_call_packet(
        mid, (const uint8_t**)arg_packets, nargs, &jl_errmsg);
    if (!call_pkt) return NULL;
    /* Build the socket path */
    /* NOTE(review): malloc result is not checked before snprintf; would
     * crash on allocation failure -- consider adding a NULL check. */
    size_t pathlen = strlen(tmpdir) + 1 + strlen(socket_name) + 1;
    char* socket_path = (char*)malloc(pathlen);
    snprintf(socket_path, pathlen, "%s/%s", tmpdir, socket_name);
    /* Send and receive */
    uint8_t* result = send_and_receive_over_socket(socket_path, call_pkt, &jl_errmsg);
    free(socket_path);
    free(call_pkt);
    return result;
}

/* -- Shared memory init (needed before daemon start in some cases) -- */

int jlmorloc_shinit(const char* basename, int volume, size_t size) {
    clear_err();
    return shinit(basename, volume, size, &jl_errmsg) ?
0 : -1; }

void jlmorloc_set_fallback_dir(const char* dir) { shm_set_fallback_dir(dir); }

================================================
FILE: data/lang/julia/lang.yaml
================================================
# Julia language descriptor for morloc compiler
# Metadata fields (read by LangRegistry) + descriptor fields (read by generic translator)

# Identity and metadata
name: jl
extension: jl
aliases: ["julia"]
is_compiled: false
run_command: ["julia"]
serial_type: "bytes"
cost: 5

# Descriptor identity (kept for compatibility with generic translator)
ldName: julia
ldExtension: jl

# Literals
ldBoolTrue: "true"
ldBoolFalse: "false"
ldNullLiteral: "nothing"

# Constructors
ldListStyle: bracket
ldTupleConstructor: ""
ldRecordConstructor: "Dict"
ldRecordSeparator: "=>"

# Access styles
ldIndexStyle: one_bracket
ldKeyAccess: bracket
ldFieldAccess: dot

# Serialize/deserialize function names (from juliamorloc.jl)
ldSerializeFn: "MorlocRuntime.put_value"
ldDeserializeFn: "MorlocRuntime.get_value"
ldIntrinsicPrefix: "MorlocRuntime."
# Foreign call
ldForeignCallFn: "MorlocRuntime.foreign_call"
ldForeignCallIntSuffix: ""

# Import syntax
ldQualifiedImports: false
ldIncludeRelToFile: true

# Template fields
ldAssignOp: "="
ldLambdaTemplate: "({{args}}) -> {{body}}"
ldDoBlockExpr: "(() -> {{expr}})"
ldDoBlockBlock: ""
ldPartialTemplate: "({{bound_args}}) -> {{fn}}({{all_args}})"
ldImportTemplate: "include(\"{{path}}\")"
ldSocketPathTemplate: "joinpath(global_state[\"tmpdir\"], {{socket}})"
ldResourcePackTemplate: "[{{mem}}, {{time}}, {{cpus}}, {{gpus}}]"
ldReturnTemplate: "return({{expr}})"
ldFuncDefHeader: "function {{name}}({{args}})"
ldBlockStyle: end_keyword
ldBlockEnd: "end"
ldErrorWrapOpen: ""
ldErrorWrapClose: []
ldPatternStyle: concat_call
ldConcatFn: "string"
ldQuoteTerminator: '"'
ldQuoteTerminatorEsc: '\"'
ldMapStyle: list_comprehension
ldDispatchLocalHeader: "dispatch = Dict("
ldDispatchLocalEntry: " {{mid}} => {{name}},"
ldDispatchLocalFooter: ")"
ldDispatchRemoteHeader: "remote_dispatch = Dict("
ldDispatchRemoteEntry: " {{mid}} => {{name}}_remote,"
ldDispatchRemoteFooter: ")"

# Pool template (loaded from pool.jl at runtime, left empty here)
ldPoolTemplate: ""
ldBreakMarker: "# <<>>"
ldCommentMarker: "#"

================================================
FILE: data/lang/julia/pool.jl
================================================
# Morloc Julia pool template
# Single-threaded daemon: accepts one connection at a time.

# Add morloc runtime to load path
const MORLOC_HOME = get(ENV, "MORLOC_HOME", joinpath(homedir(), ".local", "share", "morloc"))
push!(LOAD_PATH, joinpath(MORLOC_HOME, "lang", "julia"))

# Global state accessible to manifolds (e.g., tmpdir for foreign calls)
global_state = Dict{String,String}()

# <<>>

using MorlocRuntime

# <<>>

# <<>>

# Handle one client connection: read a packet, classify it, dispatch the
# manifold (or answer the ping), and send the result back.
function run_job(client_fd)
    try
        client_data = MorlocRuntime.stream_from_client(client_fd)
        if MorlocRuntime.is_local_call(client_data)
            (mid, args) = MorlocRuntime.read_morloc_call_packet(client_data)
            try
                result = dispatch[mid](args...)
            catch e
                result = MorlocRuntime.make_fail_packet(string(e))
            end
        elseif MorlocRuntime.is_remote_call(client_data)
            (mid, args) = MorlocRuntime.read_morloc_call_packet(client_data)
            try
                result = remote_dispatch[mid](args...)
            catch e
                result = MorlocRuntime.make_fail_packet(string(e))
            end
        elseif MorlocRuntime.is_ping(client_data)
            result = MorlocRuntime.pong(client_data)
        else
            error("Expected a ping or call type packet")
        end
        MorlocRuntime.send_packet_to_foreign_server(client_fd, result)
    catch e
        # Best-effort: wrap the error in a fail packet and send it back so the
        # caller gets a structured error instead of hanging on a closed socket.
        # Includes the full backtrace so context propagates through the stack.
        msg = sprint(showerror, e, catch_backtrace())
        try
            result = MorlocRuntime.make_fail_packet(msg)
            MorlocRuntime.send_packet_to_foreign_server(client_fd, result)
        catch
            # Client may already be gone (timed-out ping, broken pipe); ignore.
        end
        @error "job failed" exception=(e, catch_backtrace())
    finally
        MorlocRuntime.close_socket(client_fd)
    end
end

# Daemon entry point: parse ARGS, start the daemon, and serve clients in a
# loop until interrupted.
function main()
    socket_path = ARGS[1]
    tmpdir = ARGS[2]
    shm_basename = ARGS[3]
    global_state["tmpdir"] = tmpdir
    daemon = MorlocRuntime.start_daemon(socket_path, tmpdir, shm_basename, 0xffff)
    # Simple signal handling
    # NOTE(review): this task only polls `running` and installs no actual
    # signal handler -- appears to be a placeholder; confirm intent.
    running = Ref(true)
    @async begin
        try
            while running[]
                sleep(0.01)
            end
        catch
        end
    end
    try
        while running[]
            client_fd = MorlocRuntime.wait_for_client(daemon)
            if client_fd > 0
                run_job(client_fd)
            end
        end
    catch e
        if !(e isa InterruptException)
            @error "Pool error" exception=(e, catch_backtrace())
        end
    finally
        MorlocRuntime.close_daemon(daemon)
    end
end

main()

================================================
FILE: data/lang/languages.yaml
================================================
# Pairwise language costs for the morloc optimizer
#
# Same-language function overhead (intra-language call cost)
same_language_costs:
  c: 1
  cpp: 1
  py: 10
  r: 20

# Cost of calling INTO a language from a different language (IPC overhead)
cross_language_costs:
  c: 1001
  cpp: 1000
  py: 10000
  r: 40000

# Special optimized pairs (from -> to) that bypass normal IPC
optimized_pairs:
  - from: cpp
    to: c
    cost: 1

# Defaults for unknown/plugin languages
default_same_language: 10
default_cross_language: 10000

================================================
FILE: data/lang/py/Makefile
================================================
all:
	python3 setup.py build_ext --inplace
	cp -fs pymorloc.cpython* pymorloc

================================================
FILE: data/lang/py/init.sh
================================================
#!/bin/bash
# Build and install the pymorloc C extension into MORLOC_HOME/opt.
set -e

export MORLOC_HOME="$1"
BUILD_DIR="$2"
SANITIZE_FLAGS="$3"

OPT_DIR="$MORLOC_HOME/opt"

# Clean stale build artifacts
rm -f "$OPT_DIR"/pymorloc.cpython* "$OPT_DIR/pymorloc"
rm -rf "$OPT_DIR/build"

# Copy files to opt dir
cp "$BUILD_DIR/pymorloc.c" "$OPT_DIR/"
cp "$BUILD_DIR/setup.py" "$OPT_DIR/"
cp "$BUILD_DIR/Makefile" "$OPT_DIR/"

# Build pymorloc extension
export CFLAGS="$SANITIZE_FLAGS"
make -C "$OPT_DIR" -f Makefile

================================================
FILE: data/lang/py/lang.yaml
================================================
# Python language descriptor for morloc compiler
# Metadata fields (read by LangRegistry) + descriptor fields (read by generic translator)

# Identity and metadata
name: py
extension: py
aliases: ["python", "python3"]
is_compiled: false
run_command: ["python3"]
serial_type: "str"
cost: 3
preamble:
  - 'sys.path = [os.path.normpath(os.path.join(os.path.dirname(os.path.abspath(__file__)), "..", "..")), os.path.expanduser("."), os.path.expanduser("{{opt}}"), os.path.expanduser("{{lib}}")] + sys.path'
  - "import importlib"
  - "import pymorloc as morloc"

# Literals
ldBoolTrue: "True"
ldBoolFalse: "False"
ldNullLiteral: "None"

# Constructors
ldListStyle: bracket
ldTupleConstructor: ""
ldRecordConstructor: "OrderedDict"
ldRecordSeparator: "="

# Access styles
ldIndexStyle: zero_bracket
ldKeyAccess: "bracket"
ldFieldAccess: dot

# Serialize/deserialize
ldSerializeFn: "morloc.put_value"
ldDeserializeFn: "morloc.get_value"
ldIntrinsicPrefix: "morloc."

# Foreign call
ldForeignCallFn: "morloc.foreign_call"
ldForeignCallIntSuffix: ""

# Remote call
ldRemoteCallFn: "morloc.remote_call"

# Record handling
ldDictStyleRecords: true
ldQuoteRecordKeys: false

# Import syntax
ldQualifiedImports: true
ldIncludeRelToFile: false

# Template fields
ldAssignOp: "="
ldLambdaTemplate: "lambda {{args}}: {{body}}"
ldDoBlockExpr: "(lambda: {{expr}})"
ldDoBlockBlock: ""
ldPartialTemplate: "functools.partial({{fn_with_context}})"
ldImportTemplate: "{{namespace}} = importlib.import_module(\"{{module_path}}\")"
ldSocketPathTemplate: "os.path.join(global_state[\"tmpdir\"], {{socket}})"
ldResourcePackTemplate: "struct.pack('iiii', {{mem}}, {{time}}, {{cpus}}, {{gpus}})"
ldReturnTemplate: "return({{expr}})"
ldFuncDefHeader: "def {{name}}({{args}}):"
ldBlockStyle: indent
ldBlockEnd: ""
ldErrorWrapOpen: "try:"
ldErrorWrapClose:
  - "except Exception as e:"
  - " raise RuntimeError(f\"Error (pool daemon in {{name}}):\\n{e!s}\")"
ldPatternStyle: fstring
ldQuoteTerminator: '"""'
ldQuoteTerminatorEsc: '\"\"\"'
ldMapStyle: loop_append
ldDispatchLocalHeader: "dispatch = {"
ldDispatchLocalEntry: " {{mid}}: {{name}},"
ldDispatchLocalFooter: "}"
ldDispatchRemoteHeader: "remote_dispatch = {"
ldDispatchRemoteEntry: " {{mid}}: {{name}}_remote,"
ldDispatchRemoteFooter: "}"

# Pool template (loaded from pool.py, left empty here)
ldPoolTemplate: ""
ldBreakMarker: "# <<>>"
ldCommentMarker: "#"

================================================
FILE: data/lang/py/pool.py
================================================
import signal
import sys
import select
import os  # required for setting path to morloc dependencies
import time
import copy
import array
import struct
import socket as _socket
from collections import OrderedDict
from multiprocessing import Process, Value, RawValue
import ctypes
import functools

# Global variables for clean signal handling
daemon = None
workers = []
global_state = dict()
_shutdown_wakeup_fd = -1

# AUTO include sources start
# <<>>
# AUTO include sources end

# Dynamic worker spawning: monkey-patch foreign_call to track busy workers.
# Workers atomically increment busy_count before a foreign_call and decrement
# after. When busy_count reaches total_workers, a byte is written to a wake-up
# pipe to tell the main process to spawn a new worker.
_original_foreign_call = morloc.foreign_call
_busy_ref = None
_total_ref = None
_wakeup_fd = -1

def _init_worker_tracking(busy, total, wakeup_fd):
    # Install the shared counters and redirect morloc.foreign_call through
    # the busy-tracking wrapper. Called once per worker process.
    global _busy_ref, _total_ref, _wakeup_fd
    _busy_ref = busy
    _total_ref = total
    _wakeup_fd = wakeup_fd
    morloc.foreign_call = _tracked_foreign_call

def _tracked_foreign_call(*args):
    # NOTE(review): the read-then-write on a RawValue below is not atomic
    # across processes; the count drives a spawning heuristic, so small races
    # seem tolerated -- confirm this is intentional.
    prev = _busy_ref.value
    _busy_ref.value = prev + 1
    if prev + 1 >= _total_ref.value and _wakeup_fd >= 0:
        try:
            os.write(_wakeup_fd, b'!')
        except OSError:
            pass
    try:
        return _original_foreign_call(*args)
    finally:
        _busy_ref.value -= 1

# AUTO include manifolds start
# <<>>
# AUTO include manifolds end

# AUTO include dispatch start
# <<>>
# AUTO include dispatch end

def run_job(client_fd: int) -> None:
    # Handle a single client request: read the packet, dispatch it, reply.
    try:
        # Free SHM from previous dispatch result (consumed by caller)
        morloc.flush_shm_tracker()
        client_data = morloc.stream_from_client(client_fd)
        if(morloc.is_local_call(client_data)):
            (mid, args) = morloc.read_morloc_call_packet(client_data)
            try:
                result = dispatch[mid](*args)
            except Exception as e:
                result = morloc.make_fail_packet(str(e))
        elif(morloc.is_remote_call(client_data)):
            (mid, args) = morloc.read_morloc_call_packet(client_data)
            try:
                result = remote_dispatch[mid](*args)
            except Exception as e:
                result = morloc.make_fail_packet(str(e))
        elif(morloc.is_ping(client_data)):
            result = morloc.pong(client_data)
        else:
            raise ValueError("Expected a ping or call type packet")
        # Flush stdout BEFORE sending the result back. The nexus prints its
        # own output (the return value) right after receiving this response.
# Both processes share the same stdout fd, so if we flush after sending, # the nexus can print first, causing out-of-order output. sys.stdout.flush() morloc.send_packet_to_foreign_server(client_fd, result) except Exception as e: # Try to send a fail packet back to the caller before giving up. # This may fail (e.g., broken pipe from a timed-out ping), which is OK. try: result = morloc.make_fail_packet(str(e)) morloc.send_packet_to_foreign_server(client_fd, result) except Exception: pass print(f"job failed: {e!s}", file=sys.stderr) finally: # Safety-net flush for any output from error handling paths sys.stdout.flush() # close child copy morloc.close_socket(client_fd) def _send_fd(sock, fd): """Send a file descriptor over a Unix domain socket.""" sock.sendmsg([b'\x00'], [(_socket.SOL_SOCKET, _socket.SCM_RIGHTS, array.array('i', [fd]))]) def _recv_fd(sock): """Receive a file descriptor from a Unix domain socket.""" msg, ancdata, flags, addr = sock.recvmsg(1, _socket.CMSG_SPACE(4)) if not msg and not ancdata: raise EOFError("Connection closed") for cmsg_level, cmsg_type, cmsg_data in ancdata: if (cmsg_level == _socket.SOL_SOCKET and cmsg_type == _socket.SCM_RIGHTS): a = array.array('i') a.frombytes(cmsg_data[:4]) return a[0] raise RuntimeError("No fd received in ancillary data") WORKER_IDLE_TIMEOUT = 5.0 # seconds before an idle worker exits def worker_process(job_fd, tmpdir, shm_basename, shutdown_flag, busy_count, total_workers, wakeup_w): # Reset signal handlers inherited from main. If user code inside run_job # calls multiprocessing.Pool (or anything else that forks and later # SIGTERMs its own children), those grandchildren would otherwise inherit # main's signal_handler and flip the shared shutdown_flag, causing main # to SIGKILL this worker mid-response. See the multiprocessing-py-1 bug. 
    signal.signal(signal.SIGTERM, signal.SIG_DFL)
    signal.signal(signal.SIGINT, signal.SIG_DFL)
    morloc.set_fallback_dir(tmpdir)
    morloc.shinit(shm_basename, 0, 0xffff)
    _init_worker_tracking(busy_count, total_workers, wakeup_w)
    sock = _socket.fromfd(job_fd, _socket.AF_UNIX, _socket.SOCK_STREAM)
    os.close(job_fd)  # sock owns a dup'd copy
    last_activity = time.monotonic()
    try:
        while not shutdown_flag.value:
            # Short poll so the shared shutdown flag is honored promptly.
            rlist, _, _ = select.select([sock.fileno()], [], [], 0.01)
            if shutdown_flag.value:
                break
            if rlist:
                try:
                    client_fd = _recv_fd(sock)
                    run_job(client_fd)
                    last_activity = time.monotonic()
                except (EOFError, OSError):
                    break
            elif total_workers.value > 1 and time.monotonic() - last_activity > WORKER_IDLE_TIMEOUT:
                # Scale down: extra workers exit after a quiet period.
                break
    except BaseException as e:
        # Catch-all for errors that escape run_job's own exception handling:
        # MemoryError, KeyboardInterrupt, SystemExit, or bugs in the worker
        # loop itself. Without this, the worker dies silently and the nexus
        # only sees "failed to read response header" with no indication of
        # what went wrong in the pool.
        #
        # Race condition: the nexus detects the broken socket and may start
        # its clean_exit tear-down (SIGTERM -> SIGKILL) while this print is
        # still buffered. We flush immediately to maximize the chance the
        # message reaches the terminal before we are killed. stderr is
        # line-buffered (set in __main__), but the flush is a safety net for
        # edge cases (redirected stderr, forked-process buffer state).
        import traceback
        print(f"morloc pool worker fatal error: {e!s}", file=sys.stderr)
        traceback.print_exc(file=sys.stderr)
        sys.stderr.flush()
    finally:
        sock.close()

def signal_handler(sig, frame):
    global daemon
    # Ignore further SIGTERM/SIGINT during cleanup. Python processes pending
    # signals between bytecodes, including while another signal handler is
    # running, so a second SIGTERM arriving mid-cleanup would otherwise
    # re-enter this handler and double-free the daemon pointer.
    try:
        signal.signal(signal.SIGTERM, signal.SIG_IGN)
        signal.signal(signal.SIGINT, signal.SIG_IGN)
    except Exception:
        pass
    shutdown_flag.value = True
    # Wake the main select() loop so it notices the shutdown flag.
    if _shutdown_wakeup_fd >= 0:
        try:
            os.write(_shutdown_wakeup_fd, b'!')
        except OSError:
            pass
    # Capture the daemon pointer into a local and clear the global BEFORE
    # invoking close_daemon. If a pending signal still slips through and
    # re-enters this handler, it will see daemon=None and skip the free.
    d = daemon
    daemon = None
    if d is not None:
        morloc.close_daemon(d)

def client_listener(job_fd, socket_path, tmpdir, shm_basename, shutdown_flag):
    # Accept client connections and hand each client fd to an idle worker
    # over the shared Unix-socket job queue.
    global daemon
    daemon = morloc.start_daemon(socket_path, tmpdir, shm_basename, 0xffff)
    sock = _socket.fromfd(job_fd, _socket.AF_UNIX, _socket.SOCK_STREAM)
    os.close(job_fd)  # sock owns a dup'd copy
    while not shutdown_flag.value:
        try:
            client_fd = morloc.wait_for_client(daemon)
        except Exception as e:
            print(f"In python daemon, failed to connect to client: {e!s}", file=sys.stderr)
            continue
        if client_fd > 0:
            try:
                _send_fd(sock, client_fd)
            except Exception as e:
                print(f"In python daemon, failed to start worker: {e!s}", file=sys.stderr)
            finally:
                morloc.close_socket(client_fd)
    sock.close()

if __name__ == "__main__":
    # Line-buffer stderr so diagnostic output is not lost when pool is killed.
    # stdout is left fully buffered for performance (genome-scale piping) and
    # flushed explicitly after each job and during shutdown.
sys.stderr.reconfigure(line_buffering=True) shutdown_flag = Value('b', False) # Shared flag signal.signal(signal.SIGINT, signal_handler) signal.signal(signal.SIGTERM, signal_handler) # Health check: confirm imports loaded and print version if len(sys.argv) > 1 and sys.argv[1] == "--health": sys.stdout.write('{"status":"ok","version":"__MORLOC_VERSION__"}\n') sys.exit(0) # Process arguments passed from the nexus try: socket_path = sys.argv[1] tmpdir = sys.argv[2] shm_basename = sys.argv[3] except IndexError: print("Usage: script.py ") sys.exit(1) global_state["tmpdir"] = tmpdir # Shared job queue: listener writes fds to write_sock, workers read from read_sock. # Only idle workers (blocked in recvmsg) pick up jobs, preventing the round-robin # deadlock where a callback gets dispatched to a busy worker. read_sock, write_sock = _socket.socketpair(_socket.AF_UNIX, _socket.SOCK_STREAM) num_workers = 1 workers = [] # Shared counters for dynamic worker spawning. # Workers increment busy_count before foreign_call and decrement after. # When all workers are busy, main process spawns a new one. 
    busy_count = RawValue(ctypes.c_int, 0)
    total_workers = RawValue(ctypes.c_int, num_workers)
    wakeup_r, wakeup_w = os.pipe()
    os.set_blocking(wakeup_r, False)
    _shutdown_wakeup_fd = wakeup_w

    # Keep a dup of the read end so we can spawn new workers later
    spare_read_fd = os.dup(read_sock.fileno())

    for i in range(num_workers):
        worker = Process(target=worker_process,
                         args=(read_sock.fileno(), tmpdir, shm_basename, shutdown_flag,
                               busy_count, total_workers, wakeup_w))
        worker.start()
        workers.append(worker)
    read_sock.close()  # main/listener don't need the read end (spare_read_fd kept)

    # Start client listener process
    listener_process = Process(
        target=client_listener,
        args=(write_sock.fileno(), socket_path, tmpdir, shm_basename, shutdown_flag)
    )
    listener_process.start()
    write_sock.close()  # main doesn't need the write end

    # Main loop: monitor wake-up pipe, spawn new workers when all are busy,
    # and reap idle workers that have exited.
    while not shutdown_flag.value:
        rlist, _, _ = select.select([wakeup_r], [], [], 0.01)
        if rlist:
            try:
                os.read(wakeup_r, 4096)  # drain pipe
            except OSError:
                pass
        # Reap dead workers (idle timeout or error exit)
        alive = []
        for w in workers:
            if w.is_alive():
                alive.append(w)
            else:
                w.join(timeout=0)
                w.close()
        workers = alive
        total_workers.value = max(1, len(workers))
        # Spawn a new worker if all are busy (or all have exited)
        if len(workers) == 0 or busy_count.value >= total_workers.value:
            w = Process(target=worker_process,
                        args=(spare_read_fd, tmpdir, shm_basename, shutdown_flag,
                              busy_count, total_workers, wakeup_w))
            w.start()
            workers.append(w)
            total_workers.value = len(workers)

    # Shutdown sequence
    os.close(wakeup_r)
    os.close(wakeup_w)
    os.close(spare_read_fd)

    # 1. Stop listener first
    listener_process.terminate()
    listener_process.join(timeout=0.001)
    listener_process.kill()
    listener_process.join()  # Final blocking reap
    listener_process.close()

    # 2. Terminate workers with escalating force
    for p in workers:
        if p.is_alive():
            p.kill()
        p.join()  # Final blocking reap
        p.close()

    sys.exit(0)

================================================
FILE: data/lang/py/pymorloc.c
================================================
#define PY_SSIZE_T_CLEAN
#include "morloc.h"
#include "Python.h"
/* NOTE(review): the system header names below were lost in extraction
 * (angle-bracketed text stripped) -- restore from the repository. */
#include
#include
#include
#include

// boilerplate for numpy support
#define PY_ARRAY_UNIQUE_SYMBOL MORLOC_ARRAY_API
#define NPY_NO_DEPRECATED_API NPY_1_7_API_VERSION
#include

// SHM tracker for _put_value allocations (deferred cleanup)
#define SHM_TRACKER_INIT_CAP 16

typedef struct {
    absptr_t ptr;
    Schema* schema;
} shm_entry_t;

static shm_entry_t* shm_tracker = NULL;
static size_t shm_tracker_count = 0;
static size_t shm_tracker_cap = 0;

// Append an allocation to the tracker, growing the buffer geometrically.
// On realloc failure the entry is silently dropped (leaks rather than crashes).
static void shm_tracker_push(absptr_t ptr, Schema* schema) {
    if (shm_tracker_count >= shm_tracker_cap) {
        size_t new_cap = shm_tracker_cap ? shm_tracker_cap * 2 : SHM_TRACKER_INIT_CAP;
        shm_entry_t* new_buf = (shm_entry_t*)realloc(shm_tracker, new_cap * sizeof(shm_entry_t));
        if (!new_buf) return;
        shm_tracker = new_buf;
        shm_tracker_cap = new_cap;
    }
    shm_tracker[shm_tracker_count].ptr = ptr;
    shm_tracker[shm_tracker_count].schema = schema;
    shm_tracker_count++;
}

// Free every tracked SHM block (and its schema), then reset the tracker.
static void flush_shm_tracker(void) {
    for (size_t i = 0; i < shm_tracker_count; i++) {
        char* err = NULL;
        block_header_t* blk = (block_header_t*)((char*)shm_tracker[i].ptr - sizeof(block_header_t));
        if (shm_tracker[i].schema && blk->reference_count <= 1) {
            shfree_by_schema(shm_tracker[i].ptr, shm_tracker[i].schema, &err);
            if (err) { free(err); err = NULL; }
        }
        shfree(shm_tracker[i].ptr, &err);
        if (err) { free(err); }
        if (shm_tracker[i].schema) { free_schema(shm_tracker[i].schema); }
    }
    shm_tracker_count = 0;
}

#define NOTHING

#define MAYFAIL \
    char* child_errmsg_ = NULL; \
// Returns a strdup'd string that the caller must free, or NULL.
char* get_prior_err(){
    char* prior_err = NULL;
    if (PyErr_Occurred()) {
        // Fetch existing exception
        PyObject *type, *value, *traceback;
        PyErr_Fetch(&type, &value, &traceback);
        // Extract error message
        PyObject* str = PyObject_Str(value); // Convert exception to string
        if (str) {
            const char* raw = PyUnicode_AsUTF8(str);
            if (raw) {
                prior_err = strdup(raw);
            }
            Py_DECREF(str);
        }
        Py_XDECREF(type);
        Py_XDECREF(value);
        Py_XDECREF(traceback);
    }
    return prior_err;
}

/* Call a libmorloc function whose last argument is a char** error slot;
 * if it reports an error, chain it onto any pending Python exception and
 * jump to the enclosing function's `error:` label. Requires MAYFAIL. */
#define PyTRY(fun, ...) \
    fun(__VA_ARGS__ __VA_OPT__(,) &child_errmsg_); \
    if(child_errmsg_ != NULL){ \
        char* prior_err = get_prior_err(); \
        if(prior_err == NULL){ \
            PyErr_Format(PyExc_RuntimeError, "Error (%s:%d in %s):\n%s", __FILE__, __LINE__, __func__, child_errmsg_); \
        } else { \
            PyErr_Format(PyExc_RuntimeError, "%s\nError (%s:%d in %s):\n%s", prior_err, __FILE__, __LINE__, __func__, child_errmsg_); \
            free(prior_err); \
        } \
        goto error; \
    }

/* Raise a RuntimeError with file/line context, chaining any pending
 * Python exception, then jump to `error:`. */
#define PyRAISE(msg, ...) { \
    char* prior_err_ = get_prior_err(); \
    if(prior_err_ == NULL){ \
        PyErr_Format(PyExc_RuntimeError, "Error (%s:%d in %s):\n" msg "\n", __FILE__, __LINE__, __func__, ##__VA_ARGS__); \
    } else { \
        PyErr_Format(PyExc_RuntimeError, "%s\nError (%s:%d in %s):\n" msg "\n", prior_err_, __FILE__, __LINE__, __func__, ##__VA_ARGS__); \
        free(prior_err_); \
    } \
    goto error; \
}

/* If cond holds and a Python exception is already pending, re-raise it
 * with file/line context and jump to `error:`. */
#define PyTRACE(cond) \
    if(cond){ \
        char* prior_err = get_prior_err(); \
        if(prior_err != NULL){ \
            PyErr_Format(PyExc_TypeError, "Error (%s:%d in %s):\n%s", __FILE__, __LINE__, __func__, prior_err); \
            free(prior_err); \
            goto error; \
        } \
    }

PyObject* numpy_module = NULL;

// This function will be called to import numpy if, and only if, a numpy feature
// is used. This avoids the agonizingly long numpy import time.
// Lazily import numpy and initialize its C API (import_array). Always
// returns NULL; on failure a Python exception is set and numpy_module
// stays NULL.
void* import_numpy() {
    numpy_module = PyImport_ImportModule("numpy");
    if(numpy_module == NULL){
        PyRAISE("NumPy is not available");
    }
    import_array();
error:
    return NULL;
}

// Map morloc schema element type to numpy type number
// Returns -1 for element types with no numpy equivalent.
static int schema_to_npy_type(morloc_serial_type type) {
    switch (type) {
        case MORLOC_BOOL:    return NPY_BOOL;
        case MORLOC_SINT8:   return NPY_INT8;
        case MORLOC_SINT16:  return NPY_INT16;
        case MORLOC_SINT32:  return NPY_INT32;
        case MORLOC_SINT64:  return NPY_INT64;
        case MORLOC_UINT8:   return NPY_UINT8;
        case MORLOC_UINT16:  return NPY_UINT16;
        case MORLOC_UINT32:  return NPY_UINT32;
        case MORLOC_UINT64:  return NPY_UINT64;
        case MORLOC_FLOAT32: return NPY_FLOAT32;
        case MORLOC_FLOAT64: return NPY_FLOAT64;
        default:             return -1;
    }
}

// Recursively convert a morloc value (described by schema, located at data,
// with relative pointers resolved against base_ptr; base_ptr == NULL means
// resolve against the shared-memory pool) into a new Python object.
// Returns a new reference, or NULL with a Python exception set.
PyObject* fromAnything(const Schema* schema, const void* data, const void* base_ptr){
    MAYFAIL
    PyObject* obj = NULL;
    switch (schema->type) {
        case MORLOC_NIL:
            Py_RETURN_NONE;
        case MORLOC_BOOL:
            obj = PyBool_FromLong(*(bool*)data);
            break;
        case MORLOC_SINT8:
            obj = PyLong_FromLong(*(int8_t*)data);
            break;
        case MORLOC_SINT16:
            obj = PyLong_FromLong(*(int16_t*)data);
            break;
        case MORLOC_SINT32:
            obj = PyLong_FromLong(*(int32_t*)data);
            break;
        case MORLOC_SINT64:
            obj = PyLong_FromLongLong(*(int64_t*)data);
            break;
        case MORLOC_UINT8:
            obj = PyLong_FromUnsignedLong(*(uint8_t*)data);
            break;
        case MORLOC_UINT16:
            obj = PyLong_FromUnsignedLong(*(uint16_t*)data);
            break;
        case MORLOC_UINT32:
            obj = PyLong_FromUnsignedLong(*(uint32_t*)data);
            break;
        case MORLOC_UINT64:
            obj = PyLong_FromUnsignedLongLong(*(uint64_t*)data);
            break;
        case MORLOC_FLOAT32:
            obj = PyFloat_FromDouble(*(float*)data);
            break;
        case MORLOC_FLOAT64:
            obj = PyFloat_FromDouble(*(double*)data);
            break;
        case MORLOC_STRING: {
            Array* str_array = (Array*)data;
            void* tmp_ptr = NULL;
            if (str_array->size != 0) {
                tmp_ptr = PyTRY(resolve_relptr, str_array->data, base_ptr);
            }
            // The schema hint selects the concrete Python type: bytes,
            // bytearray, or (default) str.
            if (schema->hint != NULL && strcmp(schema->hint, "bytes") == 0) {
                // load binary data as a python bytes object
                if (str_array->size == 0) {
                    obj = PyBytes_FromStringAndSize("", 0); // empty bytes object
                } else {
                    obj = PyBytes_FromStringAndSize(tmp_ptr, str_array->size);
                }
                if (!obj) {
                    PyRAISE("Failed to parse data as bytes");
                }
            } else if (schema->hint != NULL && strcmp(schema->hint, "bytearray") == 0) {
                // load binary data as a python bytearray object
                if (str_array->size == 0) {
                    obj = PyByteArray_FromStringAndSize("", 0); // empty bytearray object
                } else {
                    obj = PyByteArray_FromStringAndSize(tmp_ptr, str_array->size);
                }
                if (!obj) {
                    PyRAISE("Failed to parse data as bytearray");
                }
            } else {
                // otherwise, load this as a str type
                if (str_array->size == 0) {
                    obj = PyUnicode_New(0, 127); // empty string object
                } else {
                    obj = PyUnicode_FromStringAndSize(tmp_ptr, str_array->size);
                }
                if (!obj) {
                    PyRAISE("Failed to parse data as string");
                }
            }
            break;
        }
        case MORLOC_ARRAY: {
            Array* array = (Array*)data;
            if (schema->hint != NULL && strcmp(schema->hint, "numpy.ndarray") == 0) {
                import_numpy();
                Schema* element_schema = schema->parameters[0];
                npy_intp dims[] = {array->size};
                void* absptr = NULL;
                int nd = 1; // number of dimensions
                int type_num;
                // Determine the NumPy type number based on the element schema
                switch (element_schema->type) {
                    case MORLOC_BOOL:    type_num = NPY_BOOL;    break;
                    case MORLOC_SINT8:   type_num = NPY_INT8;    break;
                    case MORLOC_SINT16:  type_num = NPY_INT16;   break;
                    case MORLOC_SINT32:  type_num = NPY_INT32;   break;
                    case MORLOC_SINT64:  type_num = NPY_INT64;   break;
                    case MORLOC_UINT8:   type_num = NPY_UINT8;   break;
                    case MORLOC_UINT16:  type_num = NPY_UINT16;  break;
                    case MORLOC_UINT32:  type_num = NPY_UINT32;  break;
                    case MORLOC_UINT64:  type_num = NPY_UINT64;  break;
                    case MORLOC_FLOAT32: type_num = NPY_FLOAT32; break;
                    case MORLOC_FLOAT64: type_num = NPY_FLOAT64; break;
                    default: PyRAISE("Unsupported element type for NumPy array");
                }
                absptr = PyTRY(resolve_relptr, array->data, base_ptr);
                // Create the NumPy array (zero-copy view over shared memory)
                obj = PyArray_SimpleNewFromData(nd, dims, type_num, absptr);
                if(obj == NULL) {
                    PyRAISE("Failed to parse data");
                }
                // Note that we do not want to give ownership to Python
                // This is shared memory, which means, python should not mutate
                // it.
            } else if (schema->hint != NULL && strcmp(schema->hint, "bytearray") == 0) {
                // Create a Python bytearray object
                void* absptr = PyTRY(resolve_relptr, array->data, base_ptr);
                obj = PyByteArray_FromStringAndSize((const char*)absptr, array->size);
                if (!obj) {
                    PyErr_SetString(PyExc_TypeError, "Failed to create bytearray");
                    goto error;
                }
                // Note: Similar to the numpy case, we don't want to give ownership to Python.
                // The bytearray is created from a copy of the data, so no additional handling is needed.
            } else if (schema->parameters[0]->type == MORLOC_UINT8) {
                // Create a Python bytes object for UINT8 arrays
                void* tmp_ptr = PyTRY(resolve_relptr, array->data, base_ptr);
                obj = PyBytes_FromStringAndSize((const char*)tmp_ptr, array->size);
                if (obj == NULL) {
                    // NOTE(review): error message looks garbled; probably
                    // meant "Failed to create bytes object"
                    PyRAISE("Failed to one bytes")
                }
            } else if (schema->hint == NULL || (schema->hint != NULL && strcmp(schema->hint, "list") == 0)) {
                // For other types, create a standard list
                obj = PyList_New(array->size);
                if(obj == NULL){
                    // NOTE(review): garbled message; probably "Failed to
                    // create list"
                    PyRAISE("Failed to one string");
                }
                if(array->size > 0){
                    char* start = (char*) PyTRY(resolve_relptr, array->data, base_ptr);
                    size_t width = schema->parameters[0]->width;
                    Schema* element_schema = schema->parameters[0];
                    // Fixed-width element slots; recurse for each element
                    for (size_t i = 0; i < array->size; i++) {
                        PyObject* item = fromAnything(element_schema, start + width * i, base_ptr);
                        if (!item || PyList_SetItem(obj, i, item) < 0) {
                            Py_XDECREF(item);
                            PyRAISE("Failed to access element in list")
                        }
                    }
                }
            } else {
                PyRAISE("Unexpected array hint");
            }
            break;
        }
        case MORLOC_TUPLE: {
            obj = PyTuple_New(schema->size);
            if(obj == NULL){
                PyRAISE("Failed in tuple");
            }
            // Each tuple field lives at a fixed offset within the record
            for (size_t i = 0; i < schema->size; i++) {
                void* item_ptr = (char*)data + schema->offsets[i];
                PyObject* item = fromAnything(schema->parameters[i], item_ptr, base_ptr);
                if (!item || PyTuple_SetItem(obj, i, item) < 0) {
                    Py_XDECREF(item);
                    PyRAISE("Failed to access tuple element");
                }
            }
            break;
        }
        case MORLOC_MAP: {
            obj = PyDict_New();
            if(obj == NULL){
                PyRAISE("Failed in map");
            }
            // Keys come from the schema; values are fields at fixed offsets
            for (size_t i = 0; i < schema->size; i++) {
                void* item_ptr = (char*)data + schema->offsets[i];
                PyObject* value = fromAnything(schema->parameters[i], item_ptr, base_ptr);
                PyObject* key = PyUnicode_FromString(schema->keys[i]);
                if (!value || !key || PyDict_SetItem(obj, key, value) < 0) {
                    Py_XDECREF(value);
                    Py_XDECREF(key);
                    PyRAISE("Failed to access map element");
                }
                Py_DECREF(key);
                Py_DECREF(value);
            }
            break;
        }
        case MORLOC_OPTIONAL: {
            // Leading byte is a presence tag: 0 -> None, nonzero -> payload
            uint8_t tag = *(const uint8_t*)data;
            if (tag == 0) {
                Py_RETURN_NONE;
            }
            obj = fromAnything(schema->parameters[0], (const char*)data + schema->offsets[0], base_ptr);
            if (!obj) {
                PyRAISE("Failed to deserialize optional inner value");
            }
            break;
        }
        case MORLOC_TENSOR: {
            import_numpy();
            const Tensor* tensor = (const Tensor*)data;
            size_t ndim = schema_tensor_ndim(schema);
            int type_num = schema_to_npy_type(schema->parameters[0]->type);
            if (type_num < 0) {
                PyRAISE("Unsupported tensor element type");
            }
            if (tensor->total_elements == 0) {
                // Empty tensor: return an empty 1-D array of the right dtype
                npy_intp zero_dims[1] = {0};
                obj = PyArray_SimpleNew(1, zero_dims, type_num);
                break;
            }
            const int64_t* shape = (const int64_t*)resolve_relptr(tensor->shape, base_ptr, NULL);
            const void* tdata = resolve_relptr(tensor->data, base_ptr, NULL);
            npy_intp np_dims[5];
            for (size_t i = 0; i < ndim; i++) np_dims[i] = (npy_intp)shape[i];
            // Create numpy array as a copy (R/W) from the data
            obj = PyArray_SimpleNewFromData((int)ndim, np_dims, type_num, (void*)tdata);
            if (!obj) {
                PyRAISE("Failed to create numpy array from tensor");
            }
            // Make a copy so the array owns its data (SHM may be freed)
            PyObject* owned = PyArray_NewCopy((PyArrayObject*)obj, NPY_CORDER);
            Py_DECREF(obj);
            obj = owned;
            if (!obj) {
                PyRAISE("Failed to copy tensor data");
            }
            break;
        }
        default:
            PyRAISE("Unsupported schema type");
    }
    return obj;
error:
    Py_XDECREF(obj);
    return NULL;
}

// Range-checked store of a Python int into a signed C integer slot `dest`;
// raises TypeError/OverflowError and jumps to `error:` on failure.
#define HANDLE_SINT_TYPE(CTYPE, PYLONG_FUNC, MIN, MAX) \
    do { \
        if (!PyLong_Check(obj)) { \
            PyErr_Format(PyExc_TypeError, "Expected int for %s, but got %s", #CTYPE, Py_TYPE(obj)->tp_name); \
            goto error; \
        } \
        long long value = PYLONG_FUNC(obj); \
        if (value < MIN || value > MAX || PyErr_Occurred()) { \
            PyErr_Format(PyExc_OverflowError, "Integer overflow for %s", #CTYPE); \
            goto error; \
        } \
        *(CTYPE*)dest = (CTYPE)value; \
    } while(0)

// Range-checked store of a Python int into an unsigned C integer slot `dest`;
// raises TypeError/OverflowError and jumps to `error:` on failure.
#define HANDLE_UINT_TYPE(CTYPE, PYLONG_FUNC, MAX) \
    do { \
        if (!PyLong_Check(obj)) { \
            PyErr_Format(PyExc_TypeError, "Expected int for %s, but got %s", #CTYPE, Py_TYPE(obj)->tp_name); \
            goto error; \
        } \
        unsigned long long value = PYLONG_FUNC(obj); \
        if (value > MAX || PyErr_Occurred()) { \
            PyErr_Format(PyExc_OverflowError, "Integer overflow for %s", #CTYPE); \
            goto error; \
        } \
        *(CTYPE*)dest = (CTYPE)value; \
    } while(0)

// Compute the number of shared-memory bytes needed to serialize obj under
// schema, including worst-case alignment padding for variable-size children.
// Returns -1 with a Python exception set when obj does not match the schema.
ssize_t get_shm_size(const Schema* schema, PyObject* obj) {
    switch (schema->type) {
        // Fixed-width scalars: size is fully determined by the schema
        case MORLOC_NIL:
        case MORLOC_BOOL:
        case MORLOC_SINT8:
        case MORLOC_SINT16:
        case MORLOC_SINT32:
        case MORLOC_SINT64:
        case MORLOC_UINT8:
        case MORLOC_UINT16:
        case MORLOC_UINT32:
        case MORLOC_UINT64:
        case MORLOC_FLOAT32:
        case MORLOC_FLOAT64:
            return schema->width;
        case MORLOC_STRING:
        case MORLOC_ARRAY:
            if (schema->type == MORLOC_STRING && !(PyUnicode_Check(obj) || PyBytes_Check(obj) || PyByteArray_Check(obj) )) {
                PyRAISE("Expected str or bytes for MORLOC_STRING, but got %s", Py_TYPE(obj)->tp_name);
            }
            if (schema->type == MORLOC_ARRAY && !(PyList_Check(obj) || PyBytes_Check(obj) || PyByteArray_Check(obj) || PyObject_HasAttrString(obj, "__array_interface__"))) {
                PyRAISE("Expected list, bytes, bytearray, or numpy array for MORLOC_ARRAY, but got %s", Py_TYPE(obj)->tp_name);
            }
            {
                ssize_t required_size = 0;
                // worst-case cursor alignment padding for element data
                required_size += (ssize_t)(schema_alignment(schema->parameters[0]) - 1);
                if (PyList_Check(obj)) {
                    Py_ssize_t list_size = PyList_Size(obj);
                    size_t element_width = schema->parameters[0]->width;
                    switch(schema->parameters[0]->type){
                        // Fixed-width elements: size is count * width
                        case MORLOC_NIL:
                        case MORLOC_BOOL:
                        case MORLOC_SINT8:
                        case MORLOC_SINT16:
                        case MORLOC_SINT32:
                        case MORLOC_SINT64:
                        case MORLOC_UINT8:
                        case MORLOC_UINT16:
                        case MORLOC_UINT32:
                        case MORLOC_UINT64:
                        case MORLOC_FLOAT32:
                        case MORLOC_FLOAT64:
                            required_size += list_size * element_width;
                            break;
                        // Variable-size elements: recurse per element
                        case MORLOC_STRING:
                        case MORLOC_ARRAY:
                        case MORLOC_TUPLE:
                        case MORLOC_MAP:
                        case MORLOC_OPTIONAL:
                            for(size_t i = 0; i < (size_t)list_size; i++){
                                required_size += get_shm_size(schema->parameters[0], PyList_GetItem(obj, i));
                            }
                            break;
                    }
                } else if (PyObject_HasAttrString(obj, "__array_interface__")) {
                    import_numpy();
                    PyArrayObject *arr = (PyArrayObject *)obj;
                    npy_intp *dims = PyArray_DIMS(arr);
                    int ndim = PyArray_NDIM(arr);
                    size_t total_elements = 1;
                    for (int i = 0; i < ndim; i++) {
                        total_elements *= dims[i];
                    }
                    required_size += total_elements * PyArray_ITEMSIZE(arr);
                } else if (PyBytes_Check(obj)) {
                    required_size += (ssize_t)PyBytes_GET_SIZE(obj);
                } else if (PyByteArray_Check(obj)) {
                    required_size += (ssize_t)PyByteArray_GET_SIZE(obj);
                } else if (PyUnicode_Check(obj)) {
                    // Writes the UTF-8 byte length into required_size.
                    // NOTE(review): this overwrites (rather than adds to) the
                    // alignment padding accumulated above -- harmless only
                    // because char elements have alignment 1; confirm.
                    PyUnicode_AsUTF8AndSize(obj, &required_size);
                } else {
                    PyRAISE("Unsupported data type");
                }
                required_size += sizeof(Array);
                return required_size;
            }
        case MORLOC_TUPLE:
            if (!PyTuple_Check(obj) && !PyList_Check(obj)) {
                PyRAISE("Expected tuple or list for MORLOC_TUPLE, but got %s", Py_TYPE(obj)->tp_name);
            }
            {
                Py_ssize_t size = PyTuple_Check(obj) ? PyTuple_Size(obj) : PyList_Size(obj);
                if ((size_t)size != schema->size) {
                    PyRAISE("Tuple/List size mismatch");
                }
                // Start from the fixed record width; add only the overflow of
                // each variable-size field beyond its inline slot.
                size_t required_size = schema->width;
                for (Py_ssize_t i = 0; i < size; ++i) {
                    PyObject* item = PyTuple_Check(obj) ? PyTuple_GetItem(obj, i) : PyList_GetItem(obj, i);
                    ssize_t element_size = get_shm_size(schema->parameters[i], item);
                    if(element_size != -1){
                        if ((size_t)element_size > schema->parameters[i]->width) {
                            required_size += (size_t)element_size - schema->parameters[i]->width;
                        }
                    } else {
                        return -1;
                    }
                }
                return (ssize_t)required_size;
            }
        case MORLOC_MAP:
            if (!PyDict_Check(obj)) {
                PyRAISE("Expected dict for MORLOC_MAP, but got %s", Py_TYPE(obj)->tp_name);
            }
            {
                size_t required_size = schema->width;
                // Missing keys contribute nothing beyond their inline slot.
                for (size_t i = 0; i < schema->size; ++i) {
                    PyObject* key = PyUnicode_FromString(schema->keys[i]);
                    PyObject* value = PyDict_GetItem(obj, key);
                    Py_DECREF(key);
                    if (value) {
                        ssize_t element_size = get_shm_size(schema->parameters[i], value);
                        if(element_size != -1){
                            if ((size_t)element_size > schema->parameters[i]->width) {
                                required_size += (size_t)element_size - schema->parameters[i]->width;
                            }
                        } else {
                            return -1;
                        }
                    }
                }
                return (ssize_t)required_size;
            }
        case MORLOC_OPTIONAL:
            if (obj == Py_None) {
                return (ssize_t)schema->width;
            }
            {
                ssize_t inner_size = get_shm_size(schema->parameters[0], obj);
                if (inner_size == -1) return -1;
                ssize_t extra = (inner_size > (ssize_t)schema->parameters[0]->width) ?
                    inner_size - (ssize_t)schema->parameters[0]->width : 0;
                return (ssize_t)schema->width + extra;
            }
        case MORLOC_TENSOR:
        {
            import_numpy();
            int type_num = schema_to_npy_type(schema->parameters[0]->type);
            if (type_num < 0) {
                PyRAISE("Unsupported tensor element type");
            }
            // Coerce to a C-contiguous array of the schema dtype
            PyArrayObject* arr = (PyArrayObject*)PyArray_FROM_OTF(obj, type_num, NPY_ARRAY_C_CONTIGUOUS);
            if (!arr) {
                PyRAISE("Expected numpy array for MORLOC_TENSOR");
            }
            size_t total = (size_t)PyArray_SIZE(arr);
            size_t elem_width = schema->parameters[0]->width;
            // Header + aligned shape vector + aligned element buffer
            ssize_t required = (ssize_t)sizeof(Tensor);
            required += (ssize_t)(_Alignof(int64_t) - 1);
            required += (ssize_t)(schema_tensor_ndim(schema) * sizeof(int64_t));
            required += (ssize_t)(schema_alignment(schema->parameters[0]) - 1);
            required += (ssize_t)(total * elem_width);
            Py_DECREF(arr);
            return required;
        }
        default:
            PyRAISE("Unsupported schema type");
    }
    PyRAISE("Reached the unreachable");
error:
    return -1;
}

// Recursively serialize obj into dest according to schema. Variable-size
// payloads are written at *cursor, which is advanced past them. Returns 0 on
// success, -1 with a Python exception set on failure.
int to_voidstar_r(void* dest, void** cursor, const Schema* schema, PyObject* obj) {
    MAYFAIL
    switch (schema->type) {
        case MORLOC_NIL:
            if (obj != Py_None) {
                PyRAISE("Expected None for MORLOC_NIL, but got %s", Py_TYPE(obj)->tp_name);
            }
            *((int8_t*)dest) = (int8_t)0;
            break;
        case MORLOC_BOOL:
            if (!PyBool_Check(obj)) {
                PyRAISE("Expected bool for MORLOC_BOOL, but got %s", Py_TYPE(obj)->tp_name);
            }
            *((bool*)dest) = (obj == Py_True);
            break;
        case MORLOC_SINT8:
            HANDLE_SINT_TYPE(int8_t, PyLong_AsLongLong, INT8_MIN, INT8_MAX);
            break;
        case MORLOC_SINT16:
            HANDLE_SINT_TYPE(int16_t, PyLong_AsLongLong, INT16_MIN, INT16_MAX);
            break;
        case MORLOC_SINT32:
            HANDLE_SINT_TYPE(int32_t, PyLong_AsLongLong, INT32_MIN, INT32_MAX);
            break;
        case MORLOC_SINT64:
            HANDLE_SINT_TYPE(int64_t, PyLong_AsLongLong, INT64_MIN, INT64_MAX);
            break;
        case MORLOC_UINT8:
            HANDLE_UINT_TYPE(uint8_t, PyLong_AsUnsignedLongLong, UINT8_MAX);
            break;
        case MORLOC_UINT16:
            HANDLE_UINT_TYPE(uint16_t, PyLong_AsUnsignedLongLong, UINT16_MAX);
            break;
        case MORLOC_UINT32:
            HANDLE_UINT_TYPE(uint32_t, PyLong_AsUnsignedLongLong,
                UINT32_MAX);
            break;
        case MORLOC_UINT64:
            HANDLE_UINT_TYPE(uint64_t, PyLong_AsUnsignedLongLong, UINT64_MAX);
            break;
        case MORLOC_FLOAT32:
            if (!PyFloat_Check(obj)) {
                PyRAISE("Expected float for MORLOC_FLOAT32, but got %s", Py_TYPE(obj)->tp_name);
            }
            *((float*)dest) = (float)PyFloat_AsDouble(obj);
            break;
        case MORLOC_FLOAT64:
            // Accept either float or int for doubles
            if(PyFloat_Check(obj)) {
                *((double*)dest) = PyFloat_AsDouble(obj);
            } else if(PyLong_Check(obj)){
                *((double*)dest) = (double)PyLong_AsLongLong(obj);
            } else {
                PyRAISE("Expected float or int for MORLOC_FLOAT64, but got %s", Py_TYPE(obj)->tp_name);
            }
            break;
        case MORLOC_STRING:
        case MORLOC_ARRAY:
            if (schema->type == MORLOC_STRING && !(PyUnicode_Check(obj) || PyBytes_Check(obj) || PyByteArray_Check(obj))) {
                PyRAISE("Expected str or bytes for MORLOC_STRING, but got %s", Py_TYPE(obj)->tp_name);
            }
            if (schema->type == MORLOC_ARRAY && !(PyList_Check(obj) || PyBytes_Check(obj) || PyByteArray_Check(obj) || PyObject_HasAttrString(obj, "__array_interface__"))) {
                PyRAISE("Expected list, bytes, bytearray, or numpy array for MORLOC_ARRAY, but got %s", Py_TYPE(obj)->tp_name);
            }
            {
                Py_ssize_t size;
                // PyBytes_AsStringAndSize / PyByteArray_AS_STRING hand back a
                // non-const pointer
                char* mutable_data = NULL;
                // str and numpy sources are read through a const pointer
                const char* immutable_data = NULL;
                if (PyList_Check(obj)) {
                    size = PyList_Size(obj);
                } else if (PyBytes_Check(obj)) {
                    // This needs non-const data
                    PyBytes_AsStringAndSize(obj, &mutable_data, &size);
                } else if (PyByteArray_Check(obj)) {
                    mutable_data = PyByteArray_AS_STRING(obj);
                    size = PyByteArray_GET_SIZE(obj);
                } else if (schema->type == MORLOC_ARRAY && PyObject_HasAttrString(obj, "__array_interface__")) {
                    // check if it is a numpy array
                    import_numpy();
                    PyArrayObject* arr = (PyArrayObject*)obj;
                    size = PyArray_SIZE(arr);
                    // This needs const data
                    immutable_data = PyArray_DATA(arr); // Get the data pointer
                    // Verify that the array is contiguous
                    if (!PyArray_ISCONTIGUOUS(arr)) {
                        PyRAISE("NumPy array must be contiguous");
                    }
                } else {
                    immutable_data = PyUnicode_AsUTF8AndSize(obj, &size);
                }
                Array* result = (Array*)dest;
                result->size = (size_t)size;
                if(result->size == 0){
                    result->data = RELNULL;
                    break;
                }
                // align cursor for element data placement
                *cursor = (void*)ALIGN_UP((uintptr_t)*cursor, schema_alignment(schema->parameters[0]));
                result->data = PyTRY(abs2rel, *cursor);
                if (PyList_Check(obj)) {
                    // Fixed size width of each element (variable size data will
                    // be written to the cursor location)
                    size_t width = schema->parameters[0]->width;
                    // Move the cursor to the location immediately after the
                    // fixed sized elements
                    *cursor = (void*)(*(char**)cursor + size * width);
                    char* start = (char*) PyTRY(rel2abs, result->data);
                    Schema* element_schema = schema->parameters[0];
                    for (Py_ssize_t i = 0; i < size; i++) {
                        PyObject* item = PyList_GetItem(obj, i);
                        if (to_voidstar_r(start + width * i, cursor, element_schema, item) != 0) {
                            goto error;
                        }
                    }
                } else if (PyBytes_Check(obj) || PyByteArray_Check(obj)){
                    absptr_t tmp_ptr = PyTRY(rel2abs, result->data);
                    memcpy(tmp_ptr, mutable_data, size);
                    // move cursor to the location after the copied data
                    *cursor = (void*)(*(char**)cursor + size);
                } else{
                    size_t width = schema->parameters[0]->width;
                    absptr_t tmp_ptr = PyTRY(rel2abs, result->data);
                    memcpy(tmp_ptr, immutable_data, size * width);
                    // Move the cursor to the location immediately after the
                    // fixed sized elements
                    *cursor = (void*)(*(char**)cursor + size * width);
                }
            }
            break;
        case MORLOC_TUPLE:
            if (!PyTuple_Check(obj) && !PyList_Check(obj)) {
                PyRAISE("Expected tuple or list for MORLOC_TUPLE, but got %s", Py_TYPE(obj)->tp_name);
            }
            {
                Py_ssize_t size = PyTuple_Check(obj) ? PyTuple_Size(obj) : PyList_Size(obj);
                if ((size_t)size != schema->size) {
                    PyRAISE("Tuple/List size mismatch");
                }
                // Each field is written into its fixed offset in the record
                for (Py_ssize_t i = 0; i < size; ++i) {
                    PyObject* item = PyTuple_Check(obj) ? PyTuple_GetItem(obj, i) : PyList_GetItem(obj, i);
                    if (to_voidstar_r((char*)dest + schema->offsets[i], cursor, schema->parameters[i], item) != 0) {
                        goto error;
                    }
                }
            }
            break;
        case MORLOC_MAP:
            if (!PyDict_Check(obj)) {
                PyRAISE("Expected dict for MORLOC_MAP, but got %s", Py_TYPE(obj)->tp_name);
            }
            {
                // Missing keys are silently skipped (their slots are left
                // as allocated)
                for (size_t i = 0; i < schema->size; ++i) {
                    PyObject* key = PyUnicode_FromString(schema->keys[i]);
                    PyObject* value = PyDict_GetItem(obj, key);
                    Py_DECREF(key);
                    if (value) {
                        if (to_voidstar_r((char*)dest + schema->offsets[i], cursor, schema->parameters[i], value) != 0) {
                            goto error;
                        }
                    }
                }
            }
            break;
        case MORLOC_OPTIONAL:
            if (obj == Py_None) {
                // tag byte 0 == absent; zero the payload slot
                *((uint8_t*)dest) = 0;
                memset((char*)dest + schema->offsets[0], 0, schema->parameters[0]->width);
            } else {
                *((uint8_t*)dest) = 1;
                if (to_voidstar_r((char*)dest + schema->offsets[0], cursor, schema->parameters[0], obj) != 0) {
                    goto error;
                }
            }
            break;
        case MORLOC_TENSOR:
        {
            import_numpy();
            int type_num = schema_to_npy_type(schema->parameters[0]->type);
            if (type_num < 0) {
                PyRAISE("Unsupported tensor element type");
            }
            PyArrayObject* arr = (PyArrayObject*)PyArray_FROM_OTF(obj, type_num, NPY_ARRAY_C_CONTIGUOUS);
            if (!arr) {
                PyRAISE("Expected numpy array for MORLOC_TENSOR");
            }
            int ndim = PyArray_NDIM(arr);
            npy_intp* np_shape = PyArray_DIMS(arr);
            size_t total = (size_t)PyArray_SIZE(arr);
            size_t elem_width = schema->parameters[0]->width;
            Tensor* tensor = (Tensor*)dest;
            tensor->total_elements = total;
            tensor->device_type = 0;
            tensor->device_id = 0;
            if (total == 0) {
                tensor->shape = RELNULL;
                tensor->data = RELNULL;
                Py_DECREF(arr);
                break;
            }
            // Write shape array
            *cursor = (void*)ALIGN_UP((uintptr_t)*cursor, _Alignof(int64_t));
            {
                char* rel_err = NULL;
                tensor->shape = abs2rel((absptr_t)*cursor, &rel_err);
                if (rel_err) {
                    free(rel_err);
                    Py_DECREF(arr);
                    PyRAISE("abs2rel failed for tensor shape");
                }
            }
            int64_t* shape_dst = (int64_t*)*cursor;
            for (int i = 0; i < ndim; i++) shape_dst[i] = (int64_t)np_shape[i];
            *cursor = (char*)*cursor + ndim * sizeof(int64_t);
            // Write data buffer
            size_t elem_align = schema_alignment(schema->parameters[0]);
            *cursor = (void*)ALIGN_UP((uintptr_t)*cursor, elem_align);
            {
                char* rel_err = NULL;
                tensor->data = abs2rel((absptr_t)*cursor, &rel_err);
                if (rel_err) {
                    free(rel_err);
                    Py_DECREF(arr);
                    PyRAISE("abs2rel failed for tensor data");
                }
            }
            memcpy(*cursor, PyArray_DATA(arr), total * elem_width);
            *cursor = (char*)*cursor + total * elem_width;
            Py_DECREF(arr);
        }
        break;
        default:
            PyRAISE("Unsupported schema type");
    }
    return 0;
error:
    return -1;
}

// Serialize obj into a single freshly-allocated shared-memory block laid out
// per schema. Returns the absolute SHM pointer (caller owns; free with
// shfree), or NULL with a Python exception set. On failure the partially
// written block is freed.
void* to_voidstar(const Schema* schema, PyObject* obj){
    MAYFAIL
    void* dest = NULL;
    // calculate the required size of the shared memory object
    ssize_t shm_size = get_shm_size(schema, obj);
    if(shm_size == -1){
        PyRAISE("Schema does not match object");
    }
    // allocate the required memory as a single block
    dest = PyTRY(shmalloc, (size_t)shm_size);
    // set the write location of variable size chunks
    void* cursor = (void*)((char*)dest + schema->width);
    // write the data to the block
    int result = to_voidstar_r(dest, &cursor, schema, obj);
    if (result != 0) {
        goto error;
    }
    return dest;
error:
    if (dest != NULL) {
        char* free_errmsg = NULL;
        shfree(dest, &free_errmsg);
        free(free_errmsg);
    }
    return NULL;
}

// Python binding: block until a client connects to the daemon held in the
// capsule argument; returns the client file descriptor as an int.
static PyObject* pybinding__wait_for_client(PyObject* self, PyObject* args) {
    MAYFAIL
    PyObject* daemon_capsule;
    if (!PyArg_ParseTuple(args, "O", &daemon_capsule)) {
        PyRAISE("Failed to parse arguments");
    }
    language_daemon_t* daemon = (language_daemon_t*)PyCapsule_GetPointer(daemon_capsule, "language_daemon_t");
    int client_fd = PyTRY(wait_for_client, daemon);
    return PyLong_FromLong((long)client_fd);
error:
    return NULL;
}

// Python binding: start the language daemon (socket_path, tmpdir,
// shm_basename, shm_default_size) and return it wrapped in a capsule.
static PyObject* pybinding__start_daemon(PyObject* self, PyObject* args) {
    MAYFAIL
    const char* socket_path;
    const char* tmpdir;
    const char* shm_basename;
    size_t shm_default_size;
    language_daemon_t* daemon = NULL;
    if (!PyArg_ParseTuple(args, "sssk", &socket_path, &tmpdir, &shm_basename, &shm_default_size)) {
        goto error;
    }
    daemon = PyTRY(
        start_daemon,
        socket_path,
            &client_fd, &packet, &packet_size)) {
        PyRAISE("Failed to parse arguments");
    }
    size_t bytes_sent = PyTRY(send_packet_to_foreign_server, client_fd, packet);
    return PyLong_FromSize_t(bytes_sent);
error:
    return NULL;
}

// Python binding: read one complete packet from client_fd and return it as a
// bytes object.
static PyObject* pybinding__stream_from_client(PyObject* self, PyObject* args){
    MAYFAIL
    int client_fd = 0;
    uint8_t* packet = NULL;
    if (!PyArg_ParseTuple(args, "i", &client_fd)) {
        PyRAISE("Failed to parse arguments");
    }
    packet = PyTRY(stream_from_client, client_fd);
    size_t packet_size = PyTRY(morloc_packet_size, packet);
    PyObject* retval = PyBytes_FromStringAndSize((char*)packet, packet_size);
    free(packet);
    return retval;
error:
    FREE(packet)
    return NULL;
}

// Python binding: close a socket file descriptor. Returns None.
static PyObject* pybinding__close_socket(PyObject* self, PyObject* args){
    int socket_id = 0;
    if (!PyArg_ParseTuple(args, "i", &socket_id)) {
        PyRAISE("Failed to parse arguments");
    }
    close_socket(socket_id);
    Py_RETURN_NONE;
error:
    return NULL;
}

// Transforms a value into a message ready for the socket
//
// Serializes a Python object under a schema string into shared memory and
// wraps it in a morloc data packet (returned as bytes). SHM referenced by the
// packet is registered in the tracker for deferred cleanup; inlined data is
// freed immediately. Schemas hinted "arrow" go through the Arrow C Data
// Interface instead of the generic serializer.
static PyObject* pybinding__put_value(PyObject* self, PyObject* args){
    MAYFAIL
    uint8_t* packet = NULL;
    Schema* schema = NULL;
    void* voidstar = NULL;
    size_t packet_size = 0;
    bool tracked = false;
    PyObject* obj;
    const char* schema_str;
    if (!PyArg_ParseTuple(args, "Os", &obj, &schema_str)) {
        PyRAISE("Failed to parse arguments");
    }
    schema = PyTRY(parse_schema, schema_str);
    // Arrow dispatch: if schema hint is "arrow", use Arrow C Data Interface
    if (schema->hint && strcmp(schema->hint, "arrow") == 0) {
        // Export pyarrow object via C Data Interface -> copy to shm -> packet
        struct ArrowSchema arrow_schema;
        struct ArrowArray arrow_array;
        // Call obj._export_to_c(arrow_array_ptr, arrow_schema_ptr)
        PyObject* export_result = PyObject_CallMethod(
            obj, "_export_to_c", "nn",
            (Py_ssize_t)&arrow_array, (Py_ssize_t)&arrow_schema);
        if (!export_result) {
            // NOTE(review): schema is freed here and PyRAISE jumps to the
            // `error:` label which (tracked == false) frees it again --
            // likely double free; confirm and fix.
            free_schema(schema);
            PyRAISE("Failed to export pyarrow object via C Data Interface");
        }
        Py_DECREF(export_result);
        char* errmsg = NULL;
        relptr_t relptr = arrow_to_shm(&arrow_array, &arrow_schema, &errmsg);
        // Release the exported C Data Interface structs
        if (arrow_schema.release) arrow_schema.release(&arrow_schema);
        if (arrow_array.release) arrow_array.release(&arrow_array);
        if (errmsg) {
            free_schema(schema);
            PyErr_SetString(PyExc_RuntimeError, errmsg);
            free(errmsg);
            return NULL;
        }
        packet = make_arrow_data_packet(relptr, schema);
        if (!packet) {
            // NOTE(review): same double-free concern as above (error label
            // frees schema again).
            free_schema(schema);
            PyRAISE("Failed to create arrow data packet");
        }
        // Track shm for cleanup
        char* resolve_err = NULL;
        void* shm_ptr = rel2abs(relptr, &resolve_err);
        if (resolve_err) {
            free(resolve_err);
        }
        if (shm_ptr) {
            shm_tracker_push((absptr_t)shm_ptr, NULL);
            tracked = true;
        }
        packet_size = PyTRY(morloc_packet_size, packet);
        PyObject* retval = PyBytes_FromStringAndSize((char*)packet, packet_size);
        free(packet);
        free_schema(schema);
        return retval;
    }
    voidstar = to_voidstar(schema, obj);
    PyTRACE(voidstar == NULL)
    // convert to a relative pointer conserved between language servers
    relptr_t relptr = PyTRY(abs2rel, voidstar);
    packet = PyTRY(make_data_packet_auto, voidstar, relptr, schema);
    {
        const morloc_packet_header_t* hdr = (const morloc_packet_header_t*)packet;
        if (hdr->command.data.source == PACKET_SOURCE_RPTR) {
            // SHM referenced by packet -- track for deferred cleanup
            shm_tracker_push((absptr_t)voidstar, schema);
            tracked = true;
        } else {
            // Data inlined in packet -- free SHM immediately
            char* free_err = NULL;
            shfree_by_schema((absptr_t)voidstar, schema, &free_err);
            if (free_err) {
                free(free_err);
                free_err = NULL;
            }
            shfree((absptr_t)voidstar, &free_err);
            if (free_err) {
                free(free_err);
            }
            voidstar = NULL;
        }
    }
    packet_size = PyTRY(morloc_packet_size, packet);
    {
        PyObject* retval = PyBytes_FromStringAndSize((char*)packet, packet_size);
        free(packet);
        if (!tracked) {
            free_schema(schema);
        }
        return retval;
    }
error:
    FREE(packet)
    if (!tracked) {
        if (voidstar && schema) {
            char* free_err = NULL;
            shfree_by_schema((absptr_t)voidstar, schema, &free_err);
            if (free_err) {
                free(free_err);
                free_err = NULL;
            }
            shfree((absptr_t)voidstar, &free_err);
            if (free_err) {
                free(free_err);
            }
        }
        free_schema(schema);
    }
    return NULL;
}

// Use a key to retrieve a value
//
// Deserializes a morloc data packet (bytes) into a Python object using a
// schema string. Dispatches on the packet header: Arrow payloads import via
// pyarrow's C Data Interface; inline voidstar payloads are read straight from
// the packet; SHM-referenced payloads are increfed and tracked for deferred
// cleanup.
static PyObject* pybinding__get_value(PyObject* self, PyObject* args){
    MAYFAIL
    uint8_t* voidstar = NULL;
    Schema* schema = NULL;
    PyObject* obj = NULL;
    bool tracked = false;
    const char* packet;
    size_t packet_size;
    const char* schema_str;
    if (!PyArg_ParseTuple(args, "y#s", &packet, &packet_size, &schema_str)) {
        PyRAISE("Failed to parse arguments");
    }
    const morloc_packet_header_t* header = (const morloc_packet_header_t*)packet;
    uint8_t source = header->command.data.source;
    uint8_t format = header->command.data.format;
    schema = PyTRY(parse_schema, schema_str)
    // Arrow dispatch: if packet format is Arrow, import via C Data Interface
    if (format == PACKET_FORMAT_ARROW) {
        voidstar = PyTRY(get_morloc_data_packet_value, (uint8_t*)packet, schema);
        const arrow_shm_header_t* arrow_hdr = (const arrow_shm_header_t*)voidstar;
        struct ArrowSchema arrow_schema;
        struct ArrowArray arrow_array;
        char* arrow_err = NULL;
        arrow_from_shm(arrow_hdr, &arrow_schema, &arrow_array, &arrow_err);
        if (arrow_err) {
            free_schema(schema);
            PyErr_SetString(PyExc_RuntimeError, arrow_err);
            free(arrow_err);
            return NULL;
        }
        // Import via pyarrow RecordBatch.from_buffers or _import_from_c
        PyObject* pyarrow_mod = PyImport_ImportModule("pyarrow");
        if (!pyarrow_mod) {
            if (arrow_schema.release) arrow_schema.release(&arrow_schema);
            if (arrow_array.release) arrow_array.release(&arrow_array);
            // NOTE(review): schema is freed here and again at the `error:`
            // label reached by PyRAISE (tracked == false) -- likely double
            // free; confirm and fix.
            free_schema(schema);
            PyRAISE("pyarrow is required for arrow-typed data");
        }
        PyObject* rb_class = PyObject_GetAttrString(pyarrow_mod, "RecordBatch");
        Py_DECREF(pyarrow_mod);
        if (!rb_class) {
            if (arrow_schema.release) arrow_schema.release(&arrow_schema);
            if (arrow_array.release) arrow_array.release(&arrow_array);
            // NOTE(review): same double-free concern as above.
            free_schema(schema);
            PyRAISE("Failed to get pyarrow.RecordBatch");
        }
        // Use RecordBatch._import_from_c(array_ptr, schema_ptr)
        obj =
PyObject_CallMethod(rb_class, "_import_from_c", "nn", (Py_ssize_t)&arrow_array, (Py_ssize_t)&arrow_schema); Py_DECREF(rb_class); // Incref shm so it stays alive while pyarrow references the buffers char* incref_err = NULL; shincref((absptr_t)voidstar, &incref_err); if (incref_err) { free(incref_err); } shm_tracker_push((absptr_t)voidstar, NULL); free_schema(schema); if (!obj) return NULL; return obj; } // Fast path: inline voidstar -- read directly from packet, no SHM needed if (source == PACKET_SOURCE_MESG && format == PACKET_FORMAT_VOIDSTAR) { const uint8_t* payload = (const uint8_t*)packet + sizeof(morloc_packet_header_t) + header->offset; obj = fromAnything(schema, (const void*)payload, (const void*)payload); PyTRACE(obj == NULL) free_schema(schema); return obj; } // SHM paths (RPTR or MESG+MSGPACK) bool is_rptr = (source == PACKET_SOURCE_RPTR); voidstar = PyTRY(get_morloc_data_packet_value, (uint8_t*)packet, schema); // For RPTR data, increment refcount so the owner's tracker flush // won't destroy data we may still need (e.g. forwarded packets). if (is_rptr) { char* incref_err = NULL; shincref((absptr_t)voidstar, &incref_err); if (incref_err) { free(incref_err); } // Track for deferred decref (tracker takes schema ownership) shm_tracker_push((absptr_t)voidstar, schema); tracked = true; } obj = fromAnything(schema, voidstar, NULL); PyTRACE(obj == NULL) if (!tracked) { free_schema(schema); } return obj; error: if (!tracked) { free_schema(schema); } return NULL; } // Free tracked SHM allocations from put_value calls. // Called at dispatch start to free result SHM from previous dispatch. static PyObject* pybinding__flush_shm_tracker(PyObject* self, PyObject* args) { (void)self; (void)args; flush_shm_tracker(); Py_RETURN_NONE; } // Make a foreign call // // Arguments: // 1. socket path // 2. midx // 3. 
// list of arguments, each is bytestring packet
//
// Build a local-call packet for manifold `mid`, send it over the Unix socket
// at `socket_path`, and return the raw response packet as Python bytes.
// If the response is an RPTR (shared-memory reference), its SHM block is
// incref'd and tracked so the callee's tracker flush cannot destroy it.
static PyObject* pybinding__foreign_call(PyObject* self, PyObject* args) {
    MAYFAIL
    char* socket_path;
    int mid;
    PyObject* py_args;
    const uint8_t** arg_packets = NULL;
    Py_ssize_t nargs;
    Py_ssize_t i;
    uint8_t* packet = NULL;
    uint8_t* result = NULL;
    size_t result_length = 0;

    // Parse arguments: string, integer, and sequence
    if (!PyArg_ParseTuple(args, "siO", &socket_path, &mid, &py_args)) {
        PyRAISE("Failed to parse argument")
    }

    // Verify third argument is a sequence
    if (!PySequence_Check(py_args)) {
        PyRAISE("Third argument must be a sequence");
    }

    // Get sequence size and allocate C arrays
    nargs = PySequence_Size(py_args);
    arg_packets = (const uint8_t**)calloc(nargs, sizeof(uint8_t*));
    if (!arg_packets) {
        PyErr_NoMemory();
        goto error;
    }

    // Convert Python bytes to C buffers
    // NOTE(review): PySequence_GetItem can return NULL on failure, which is
    // not checked before PyBytes_Check -- confirm the caller always passes a
    // well-formed list.  The borrowed buffer stays valid after Py_DECREF
    // because py_args still holds a reference to each bytes object.
    for (i = 0; i < nargs; i++) {
        PyObject* item = PySequence_GetItem(py_args, i);
        if (!PyBytes_Check(item)) {
            Py_DECREF(item);
            free(arg_packets);
            arg_packets = NULL;
            PyRAISE("All arguments must be bytes objects");
        }
        arg_packets[i] = (const uint8_t*)PyBytes_AsString(item);
        Py_DECREF(item);
    }

    packet = PyTRY(make_morloc_local_call_packet, (uint32_t)mid, arg_packets, (size_t)nargs);
    free(arg_packets);
    arg_packets = NULL;

    result = PyTRY(send_and_receive_over_socket, socket_path, packet);
    free(packet);
    packet = NULL;

    // Incref the result's SHM so the callee's tracker flush won't destroy
    // data we may still need (e.g. forwarded result packets).
    {
        const morloc_packet_header_t* res_header = (const morloc_packet_header_t*)result;
        if (res_header->command.data.source == PACKET_SOURCE_RPTR) {
            // RPTR payload is a relative pointer into shared memory
            size_t relptr = *(size_t*)((uint8_t*)result + res_header->offset + sizeof(morloc_packet_header_t));
            char* resolve_err = NULL;
            void* res_voidstar = rel2abs(relptr, &resolve_err);
            if (resolve_err) { free(resolve_err); resolve_err = NULL; }
            if (res_voidstar) {
                char* incref_err = NULL;
                shincref((absptr_t)res_voidstar, &incref_err);
                if (incref_err) { free(incref_err); }
                shm_tracker_push((absptr_t)res_voidstar, NULL);
            }
        }
    }

    result_length = PyTRY(morloc_packet_size, result);
    PyObject* retval = PyBytes_FromStringAndSize((char*)result, result_length);
    free(result);
    return retval;

error:
    FREE(arg_packets)
    FREE(packet)
    return NULL;
}

// Submit a call to a remote (e.g. cluster) executor and return the response
// packet as bytes, or None when the remote call yields no result.
static PyObject* pybinding__remote_call(PyObject* self, PyObject* args) {
    MAYFAIL
    int midx;
    char* socket_base;
    char* cache_path;
    PyObject* res_struct; // python struct that is converted to a resource_t struct
    PyObject* arg_packets_obj; // python list of bytes types
    const uint8_t** arg_packets = NULL;
    uint8_t* result = NULL;

    if (!PyArg_ParseTuple(args, "issOO", &midx, &socket_base, &cache_path, &res_struct, &arg_packets_obj)) {
        PyRAISE("Failed to parse arguments");
    }
    if (!PyBytes_Check(res_struct)) {
        PyRAISE("res_struct must be a bytes object from struct.pack()");
    }
    // Ensure the resources struct is the right size
    if (PyBytes_Size(res_struct) != sizeof(resources_t)) {
        PyRAISE("Struct size mismatch");
    }
    // Reinterpret the packed Python bytes as the C resources struct
    resources_t* res = (resources_t*)PyBytes_AsString(res_struct);
    PyTRACE(res == NULL)

    Py_ssize_t nargs = PyList_Size(arg_packets_obj);
    arg_packets = calloc(nargs, sizeof(uint8_t*));
    if (arg_packets == NULL) {
        PyRAISE("Memory allocation failed");
    }
    for (Py_ssize_t i = 0; i < nargs; i++) {
        PyObject* packet_obj = PyList_GetItem(arg_packets_obj, i);
        if (!PyBytes_Check(packet_obj)) {
            PyRAISE("Packets must be bytes");
        }
        arg_packets[i] = (uint8_t*)PyBytes_AsString(packet_obj);
    }

    result = PyTRY( remote_call, midx, socket_base, cache_path, res, arg_packets, (size_t)nargs );
    free(arg_packets);

    if (result == NULL) Py_RETURN_NONE;

    size_t result_length = PyTRY(morloc_packet_size, result);
    PyObject* py_result = PyBytes_FromStringAndSize((char*)result, result_length);
    free(result);
    return py_result;

error:
    if (result != NULL){
        free(result);
    }
    if (arg_packets != NULL){
        // The elements are handled by Python and should not be freed
        free(arg_packets);
    }
    return NULL;
}

// Return True iff the packet is a ping packet
static PyObject* pybinding__is_ping(PyObject* self, PyObject* args) {
    MAYFAIL
    char* packet;
    size_t packet_size;
    if (!PyArg_ParseTuple(args, "y#", &packet, &packet_size)) {
        PyRAISE("Failed to parse arguments");
    }
    bool is_ping = PyTRY(packet_is_ping, (uint8_t*)packet);
    PyObject* obj = PyBool_FromLong((long)is_ping);
    return obj;
error:
    return NULL;
}

// Return True iff the packet is a local (same-machine) call packet
static PyObject* pybinding__is_local_call(PyObject* self, PyObject* args) {
    MAYFAIL
    char* packet;
    size_t packet_size;
    if (!PyArg_ParseTuple(args, "y#", &packet, &packet_size)) {
        PyRAISE("Failed to parse arguments");
    }
    bool is_local_call = PyTRY(packet_is_local_call, (uint8_t*)packet);
    PyObject* obj = PyBool_FromLong((long)is_local_call);
    return obj;
error:
    return NULL;
}

// Return True iff the packet is a remote call packet
static PyObject* pybinding__is_remote_call(PyObject* self, PyObject* args) {
    MAYFAIL
    char* packet;
    size_t packet_size;
    if (!PyArg_ParseTuple(args, "y#", &packet, &packet_size)) {
        PyRAISE("Failed to parse arguments");
    }
    bool is_remote_call = PyTRY(packet_is_remote_call, (uint8_t*)packet);
    PyObject* obj = PyBool_FromLong((long)is_remote_call);
    return obj;
error:
    return NULL;
}

// Build and return the pong response for a ping packet (as bytes)
static PyObject* pybinding__pong(PyObject* self, PyObject* args) {
    MAYFAIL
    char* packet;
    size_t packet_size;
    uint8_t* pong = NULL;
    if (!PyArg_ParseTuple(args, "y#", &packet, &packet_size)) {
        PyRAISE("Failed to parse arguments");
    }
    pong = PyTRY(return_ping, (uint8_t*)packet);
    size_t pong_size = PyTRY(morloc_packet_size, pong);
    {
        PyObject* retval = PyBytes_FromStringAndSize((char*)pong, pong_size);
        free(pong);
        return retval;
    }
error:
    FREE(pong)
    return NULL;
}

// Set the directory used for file-backed shared memory when POSIX SHM is
// unavailable.  Returns None.
static PyObject* pybinding__set_fallback_dir(PyObject* self, PyObject* args) {
    const char* dir;
    if (!PyArg_ParseTuple(args, "s", &dir)) {
        return NULL;
    }
    shm_set_fallback_dir(dir);
    Py_RETURN_NONE;
}

// Open (or attach to) the shared memory pool and return it as a PyCapsule
// named "shm_t".  The capsule has no destructor; the pool outlives it.
static PyObject* pybinding__shinit(PyObject* self, PyObject* args) {
    MAYFAIL
    shm_t* shm = NULL;
    const char* shm_basename;
    size_t volume_index;
    size_t shm_default_size;
    if (!PyArg_ParseTuple(args, "skk", &shm_basename, &volume_index, &shm_default_size)) {
        PyRAISE("Failed to parse arguments");
    }
    shm = PyTRY( shinit, shm_basename, volume_index, shm_default_size );
    return PyCapsule_New(shm, "shm_t", NULL);
error:
    FREE(shm)
    return NULL;
}

// Create a fail packet wrapping an error message; returns it as bytes.
static PyObject* pybinding__make_fail_packetg(PyObject* self, PyObject* args) {
    MAYFAIL
    const char* packet_errmsg;
    uint8_t* packet = NULL;
    if (!PyArg_ParseTuple(args, "s", &packet_errmsg)) {
        PyRAISE("Failed to parse arguments");
    }
    packet = make_fail_packet(packet_errmsg);
    size_t packet_size = PyTRY(morloc_packet_size, packet);
    {
        PyObject* retval = PyBytes_FromStringAndSize((char*)packet, packet_size);
        free(packet);
        return retval;
    }
error:
    FREE(packet)
    return NULL;
}

// Hash a Python value under a schema: serialize to SHM voidstar, hash it,
// and return the hex digest as a Python str.  SHM and schema are always
// released before returning.
static PyObject* pybinding__mlc_hash(PyObject* self, PyObject* args) {
    MAYFAIL
    PyObject* obj;
    const char* schema_str;
    Schema* schema = NULL;
    void* voidstar = NULL;
    char* hex = NULL;
    if (!PyArg_ParseTuple(args, "Os", &obj, &schema_str)) {
        PyRAISE("Failed to parse arguments");
    }
    schema = PyTRY(parse_schema, schema_str);
    voidstar = to_voidstar(schema, obj);
    PyTRACE(voidstar == NULL)
    hex = PyTRY(mlc_hash, voidstar, schema);
    {
        // best-effort free; any shfree error string is discarded
        char* shfree_errmsg = NULL;
        shfree(voidstar, &shfree_errmsg);
        free(shfree_errmsg);
    }
    free_schema(schema);
    {
        PyObject* retval = PyUnicode_FromString(hex);
        free(hex);
        return retval;
    }
error:
    if (voidstar) {
        char* shfree_errmsg = NULL;
        shfree(voidstar, &shfree_errmsg);
        free(shfree_errmsg);
    }
    free_schema(schema);
    FREE(hex)
    return NULL;
}

// Save a Python value to file in msgpack format.  Returns None.
static PyObject* pybinding__mlc_save(PyObject* self, PyObject* args) {
    MAYFAIL
    PyObject* obj;
    const char* schema_str;
    const char* path;
    Schema* schema = NULL;
    void* voidstar = NULL;
    if (!PyArg_ParseTuple(args, "Oss", &obj, &schema_str, &path)) {
        PyRAISE("Failed to parse arguments");
    }
    schema = PyTRY(parse_schema, schema_str);
    voidstar = to_voidstar(schema, obj);
    PyTRACE(voidstar == NULL)
    PyTRY(mlc_save, voidstar, schema, path);
    {
        char* shfree_errmsg = NULL;
        shfree(voidstar, &shfree_errmsg);
        free(shfree_errmsg);
    }
    free_schema(schema);
    Py_RETURN_NONE;
error:
    if (voidstar) {
        char* shfree_errmsg = NULL;
        shfree(voidstar, &shfree_errmsg);
        free(shfree_errmsg);
    }
    free_schema(schema);
    return NULL;
}

// Save a Python value to file in flat voidstar binary format.  Returns None.
static PyObject* pybinding__mlc_save_voidstar(PyObject* self, PyObject* args) {
    MAYFAIL
    PyObject* obj;
    const char* schema_str;
    const char* path;
    Schema* schema = NULL;
    void* voidstar = NULL;
    if (!PyArg_ParseTuple(args, "Oss", &obj, &schema_str, &path)) {
        PyRAISE("Failed to parse arguments");
    }
    schema = PyTRY(parse_schema, schema_str);
    voidstar = to_voidstar(schema, obj);
    PyTRACE(voidstar == NULL)
    PyTRY(mlc_save_voidstar, voidstar, schema, path);
    {
        char* shfree_errmsg = NULL;
        shfree(voidstar, &shfree_errmsg);
        free(shfree_errmsg);
    }
    free_schema(schema);
    Py_RETURN_NONE;
error:
    if (voidstar) {
        char* shfree_errmsg = NULL;
        shfree(voidstar, &shfree_errmsg);
        free(shfree_errmsg);
    }
    free_schema(schema);
    return NULL;
}

// Save a Python value to file in JSON format.  Returns None.
static PyObject* pybinding__mlc_save_json(PyObject* self, PyObject* args) {
    MAYFAIL
    PyObject* obj;
    const char* schema_str;
    const char* path;
    Schema* schema = NULL;
    void* voidstar = NULL;
    if (!PyArg_ParseTuple(args, "Oss", &obj, &schema_str, &path)) {
        PyRAISE("Failed to parse arguments");
    }
    schema = PyTRY(parse_schema, schema_str);
    voidstar = to_voidstar(schema, obj);
    PyTRACE(voidstar == NULL)
    PyTRY(mlc_save_json, voidstar, schema, path);
    {
        char* shfree_errmsg = NULL;
        shfree(voidstar, &shfree_errmsg);
        free(shfree_errmsg);
    }
    free_schema(schema);
    Py_RETURN_NONE;
error:
    if (voidstar) {
        char* shfree_errmsg = NULL;
        shfree(voidstar, &shfree_errmsg);
        free(shfree_errmsg);
    }
    free_schema(schema);
    return NULL;
}

// Serialize a Python value to a JSON string (returned as str).
static PyObject* pybinding__mlc_show(PyObject* self, PyObject* args) {
    MAYFAIL
    PyObject* obj;
    const char* schema_str;
    Schema* schema = NULL;
    void* voidstar = NULL;
    char* json = NULL;
    if (!PyArg_ParseTuple(args, "Os", &obj, &schema_str)) {
        PyRAISE("Failed to parse arguments");
    }
    schema = PyTRY(parse_schema, schema_str);
    voidstar = to_voidstar(schema, obj);
    PyTRACE(voidstar == NULL)
    json = PyTRY(mlc_show, voidstar, schema);
    {
        char* shfree_errmsg = NULL;
        shfree(voidstar, &shfree_errmsg);
        free(shfree_errmsg);
    }
    free_schema(schema);
    {
        PyObject* retval = PyUnicode_FromString(json);
        free(json);
        return retval;
    }
error:
    if (voidstar) {
        char* shfree_errmsg = NULL;
        shfree(voidstar, &shfree_errmsg);
        free(shfree_errmsg);
    }
    free_schema(schema);
    FREE(json)
    return NULL;
}

// Deserialize a JSON string to a Python value under a schema.  Returns None
// when parsing yields no value (mlc_read errors are swallowed here).
static PyObject* pybinding__mlc_read(PyObject* self, PyObject* args) {
    MAYFAIL
    const char* schema_str;
    const char* json_str;
    Schema* schema = NULL;
    void* voidstar = NULL;
    if (!PyArg_ParseTuple(args, "ss", &schema_str, &json_str)) {
        PyRAISE("Failed to parse arguments");
    }
    schema = PyTRY(parse_schema, schema_str);
    {
        // NOTE(review): the mlc_read error message is discarded; failures
        // surface only as a None return below.
        char* errmsg = NULL;
        voidstar = mlc_read(json_str, schema, &errmsg);
        if (errmsg != NULL) {
            free(errmsg);
        }
    }
    if (voidstar == NULL) {
        free_schema(schema);
        Py_RETURN_NONE;
    }
    {
        PyObject* obj = fromAnything(schema, voidstar, NULL);
        char* shfree_errmsg = NULL;
        shfree(voidstar, &shfree_errmsg);
        free(shfree_errmsg);
        free_schema(schema);
        PyTRACE(obj == NULL)
        return obj;
    }
error:
    if (voidstar) {
        char* shfree_errmsg = NULL;
        shfree(voidstar, &shfree_errmsg);
        free(shfree_errmsg);
    }
    free_schema(schema);
    return NULL;
}

// Load a value from file (path, schema) and return it as a Python object;
// returns None if the load yields no value.
static PyObject* pybinding__mlc_load(PyObject* self, PyObject* args) {
    MAYFAIL
    const char* schema_str;
    const char* path;
    Schema* schema = NULL;
    void* voidstar = NULL;
    if (!PyArg_ParseTuple(args, "ss", &schema_str, &path)) {
        PyRAISE("Failed to parse arguments");
    }
    schema = PyTRY(parse_schema, schema_str);
    voidstar = PyTRY(mlc_load, path, schema);
    if (voidstar == NULL) {
        free_schema(schema);
        Py_RETURN_NONE;
    }
    {
        PyObject* obj = fromAnything(schema, voidstar, NULL);
        char* shfree_errmsg = NULL;
        shfree(voidstar, &shfree_errmsg);
        free(shfree_errmsg);
        free_schema(schema);
        PyTRACE(obj == NULL)
        return obj;
    }
error:
    if (voidstar) {
        char* shfree_errmsg = NULL;
        shfree(voidstar, &shfree_errmsg);
        free(shfree_errmsg);
    }
    free_schema(schema);
    return NULL;
}

// Method table mapping Python-visible names to the C bindings above.
static PyMethodDef Methods[] = {
    {"set_fallback_dir", pybinding__set_fallback_dir, METH_VARARGS, "Set fallback directory for file-backed shared memory"},
    {"shinit", pybinding__shinit, METH_VARARGS, "Open the shared memory pool"},
    {"start_daemon", pybinding__start_daemon, METH_VARARGS, "Initialize the shared memory and socket for the python daemon"},
    {"close_daemon", pybinding__close_daemon, METH_VARARGS, "Banish the daemon back to the abyss from whence it came"},
    {"wait_for_client", pybinding__wait_for_client, METH_VARARGS, "Listen over a pipe until a client packet arrives"},
    {"read_morloc_call_packet", pybinding__read_morloc_call_packet, METH_VARARGS, "Parse a morloc call packet"},
    {"send_packet_to_foreign_server", pybinding__send_packet_to_foreign_server, METH_VARARGS, "Send data to a foreign server"},
    {"stream_from_client", pybinding__stream_from_client, METH_VARARGS, "Stream data from the client"},
    {"close_socket", pybinding__close_socket, METH_VARARGS, "Close the socket"},
    {"flush_shm_tracker", pybinding__flush_shm_tracker, METH_NOARGS, "Free tracked SHM allocations from put_value calls"},
    {"foreign_call", pybinding__foreign_call, METH_VARARGS, "Send a call packet to a foreign pool"},
    {"get_value", pybinding__get_value, METH_VARARGS, "Convert a packet to a Python value"},
    {"put_value", pybinding__put_value, METH_VARARGS, "Convert a Python value to a packet"},
    {"is_ping", pybinding__is_ping, METH_VARARGS, "Packet is a ping"},
    {"is_local_call", pybinding__is_local_call, METH_VARARGS, "Packet is a local call"},
    {"is_remote_call", pybinding__is_remote_call, METH_VARARGS, "Packet is a remote call"},
    {"pong", pybinding__pong, METH_VARARGS, "Return a ping"},
    {"make_fail_packet", pybinding__make_fail_packetg, METH_VARARGS, "Create a fail packet from an error message"},
    {"remote_call", pybinding__remote_call, METH_VARARGS, "Make a call to a remote cluster"},
    {"mlc_hash", pybinding__mlc_hash, METH_VARARGS, "Hash a value using xxhash"},
    {"mlc_save", pybinding__mlc_save, METH_VARARGS, "Save a value to file in msgpack format"},
    {"mlc_save_voidstar", pybinding__mlc_save_voidstar, METH_VARARGS, "Save a value to file in flat voidstar binary format"},
    {"mlc_save_json", pybinding__mlc_save_json, METH_VARARGS, "Save a value to file in JSON format"},
    {"mlc_load", pybinding__mlc_load, METH_VARARGS, "Load a value from file"},
    {"mlc_show", pybinding__mlc_show, METH_VARARGS, "Serialize a value to JSON string"},
    {"mlc_read", pybinding__mlc_read, METH_VARARGS, "Deserialize a JSON string to a value"},
    {NULL, NULL, 0, NULL} // this is a sentinel value
};

// Module definition and entry point for the `pymorloc` extension module.
static struct PyModuleDef pymorloc = {
    PyModuleDef_HEAD_INIT,
    "pymorloc",
    "Python interface to Morloc binary and MessagePack data",
    -1,
    Methods
};

PyMODINIT_FUNC PyInit_pymorloc(void) {
    return PyModule_Create(&pymorloc);
}


================================================ FILE: data/lang/py/setup.py ================================================
# Build script for the pymorloc CPython extension.  Compiles pymorloc.c
# against the morloc runtime headers/library installed under MORLOC_HOME.
import os
from setuptools import setup, Extension
import numpy as np

# numpy headers are required at build time for the array bindings
try:
    np_include_path = np.get_include()
except AttributeError:
    raise RuntimeError("Numpy is required to build this extension")

# Default install root matches the morloc compiler's data directory
morloc_home = os.environ.get(
    'MORLOC_HOME',
    os.path.expanduser('~/.local/share/morloc')
)

module = Extension(
    'pymorloc',
    sources=['pymorloc.c'],
    include_dirs=[
        os.path.join(morloc_home, 'include'),
        np_include_path
    ],
    library_dirs=[os.path.join(morloc_home, 'lib')],
    # rpath so the extension finds libmorloc without LD_LIBRARY_PATH
    runtime_library_dirs=[os.path.join(morloc_home, 'lib')],
    libraries=['morloc']
)

setup(
    name='pymorloc',
    version='0.1',
    ext_modules=[module],
    extras_require={
        'numpy': ['numpy']
    }
)
================================================ FILE: data/lang/r/init.sh ================================================
#!/bin/bash
# Build librmorloc.so, the C bridge between R and the morloc runtime.
# Usage: init.sh MORLOC_HOME BUILD_DIR SANITIZE_FLAGS
set -e

MORLOC_HOME="$1"
BUILD_DIR="$2"
SANITIZE_FLAGS="$3"

INCLUDE_DIR="$MORLOC_HOME/include"
LIB_DIR="$MORLOC_HOME/lib"

# Write source to include dir (R CMD SHLIB expects it there)
cp "$BUILD_DIR/rmorloc.c" "$INCLUDE_DIR/"

# Compile directly with gcc so SANITIZE_FLAGS can be passed at both compile
# and link time. R CMD SHLIB drops sanitizer flags from the link step, which
# would leave librmorloc.so with unresolved ubsan symbols (R itself is not
# built with ubsan, so dlopen would fail with:
#   "undefined symbol: __ubsan_handle_type_mismatch_v1_abort").
#
# We only link against R's core shared lib (libR). R's full --ldflags include
# libs the R interpreter uses (pcre2, tirpc, icu...) that may not be present
# as separate dev packages on the build machine; R-loadable shared objects
# resolve those symbols through the loaded R interpreter at dlopen time, not
# at link time.
R_CPPFLAGS=$(R CMD config --cppflags)
R_HOME=$(R RHOME)

gcc $R_CPPFLAGS -I"$INCLUDE_DIR" $SANITIZE_FLAGS -fpic -O2 \
    -c "$INCLUDE_DIR/rmorloc.c" -o "$INCLUDE_DIR/rmorloc.o"

gcc -shared $SANITIZE_FLAGS \
    -Wl,-Bsymbolic-functions -Wl,-z,relro \
    -o "$LIB_DIR/librmorloc.so" "$INCLUDE_DIR/rmorloc.o" \
    -L"$LIB_DIR" -Wl,-rpath,"$LIB_DIR" -lmorloc -lpthread \
    -L"$R_HOME/lib" -lR

# Clean up
rm -f "$INCLUDE_DIR/rmorloc.c" "$INCLUDE_DIR/rmorloc.o"


================================================ FILE: data/lang/r/lang.yaml ================================================
# R language descriptor for morloc compiler
# Metadata fields (read by LangRegistry) + descriptor fields (read by generic translator)

# Identity and metadata
name: r
extension: R
aliases: []
is_compiled: false
run_command: ["Rscript"]
serial_type: "character"
cost: 4
# Lines prepended to every generated R pool: load the C bridge and define a
# source helper that resolves paths relative to the generated script.
preamble:
  - 'dyn.load("{{home}}/lib/librmorloc.so")'
  - '.morloc.srcdir <- normalizePath(file.path(dirname(sub("^--file=", "", grep("^--file=", commandArgs(FALSE), value=TRUE)[1])), "..", ".."), mustWork=FALSE)'
  - '.morloc.source <- function(p) source(ifelse(startsWith(p, "/"), p, file.path(.morloc.srcdir, p)), chdir=TRUE)'

# Literals
ldBoolTrue: "TRUE"
ldBoolFalse: "FALSE"
ldNullLiteral: "NULL"

# Constructors
ldListStyle: type_dependent
ldTupleConstructor: "list"
ldRecordConstructor: "list"
ldRecordSeparator: "="

# Access styles
ldIndexStyle: one_double_bracket
ldKeyAccess: "double_bracket"
ldFieldAccess: dollar

# Serialize/deserialize
ldSerializeFn: "morloc_put_value"
ldDeserializeFn: "morloc_get_value"
ldIntrinsicPrefix: "morloc_"

# Foreign call
ldForeignCallFn: "morloc_foreign_call"
ldForeignCallIntSuffix: "L"
ldIntLiteralSuffix: "L"

# Remote call
ldRemoteCallFn: "morloc_remote_call"

# Record handling
ldDictStyleRecords: false
ldQuoteRecordKeys: false

# Import syntax
ldQualifiedImports: false
ldIncludeRelToFile: false

# Template fields
ldAssignOp: "<-"
ldLambdaTemplate: "function({{args}}) { {{body}} }"
ldDoBlockExpr: "(function() {{expr}})"
ldDoBlockBlock: "(function(){\n{{body}}\n})"
ldPartialTemplate: "function({{bound_args}}) { {{fn}}({{all_args}}) }"
ldImportTemplate: ".morloc.source(\"{{path}}\")"
ldSocketPathTemplate: "paste0(global_state$tmpdir, \"/\", {{socket}})"
ldResourcePackTemplate: "list(memory={{mem}}L, time={{time}}L, cpus={{cpus}}L, gpus={{gpus}}L)"
ldReturnTemplate: "return({{expr}})"
ldFuncDefHeader: "{{name}} <- function({{args}})"
ldBlockStyle: braces
ldBlockEnd: "}"
ldErrorWrapOpen: ""
ldErrorWrapClose: []
ldPatternStyle: concat_call
ldConcatFn: "paste0"
ldQuoteTerminator: '"'
ldQuoteTerminatorEsc: '\"'
ldAtomicTypes: ["integer", "numeric", "double", "logical", "character"]
ldAtomicListFn: "c"
ldGenericListFn: "list"
ldMapStyle: apply_callback
ldDispatchLocalHeader: ".dispatch <- list()"
ldDispatchLocalEntry: ".dispatch[[{{mid}}L]] <- {{name}}"
ldDispatchLocalFooter: ""
ldDispatchRemoteHeader: ".remote_dispatch <- list()"
ldDispatchRemoteEntry: ".remote_dispatch[[{{mid}}L]] <- {{name}}_remote"
ldDispatchRemoteFooter: ""

# Pool template (loaded from pool.R, left empty here)
ldPoolTemplate: ""
ldBreakMarker: "# <<>>"
ldCommentMarker: "#"


================================================ FILE: data/lang/r/pool.R ================================================
# R pool script: hosts user functions behind a Unix socket daemon, dispatching
# call packets to forked worker processes via the librmorloc C bridge.

# AUTO include sources start
# <<>>
# AUTO include sources end

# Thin R wrappers over the librmorloc .Call entry points.
morloc_is_ping <- function(...){
  .Call("morloc_is_ping", ...)
}
morloc_pong <- function(...){
  .Call("morloc_pong", ...)
}
morloc_is_local_call <- function(...){
  .Call("morloc_is_local_call", ...)
}
morloc_is_remote_call <- function(...){
  .Call("morloc_is_remote_call", ...)
}
morloc_make_fail_packet <- function(...){
  .Call("morloc_make_fail_packet", ...)
}
morloc_wait_for_client <- function(...){
  .Call("morloc_wait_for_client", ...)
}
morloc_stream_from_client <- function(...){
  .Call("morloc_stream_from_client", ...)
}
morloc_read_morloc_call_packet <- function(...){
  .Call("morloc_read_morloc_call_packet", ...)
}
morloc_send_packet_to_foreign_server <- function(...){
  .Call("morloc_send_packet_to_foreign_server", ...)
}
morloc_close_socket <- function(...){
  .Call("morloc_close_socket", ...)
}
morloc_start_daemon <- function(...){
  .Call("morloc_start_daemon", ...)
}
morloc_shinit <- function(...){
  .Call("morloc_shinit", ...)
}
morloc_foreign_call <- function(...){
  .Call("morloc_foreign_call", ...)
}
morloc_get_value <- function(...){
  .Call("morloc_get_value", ...)
}
morloc_put_value <- function(...){
  .Call("morloc_put_value", ...)
}
morloc_mlc_show <- function(...){
  .Call("morloc_mlc_show", ...)
}
morloc_socketpair <- function(...){
  .Call("morloc_socketpair", ...)
}
morloc_fork <- function(...){
  .Call("morloc_fork", ...)
}
morloc_send_fd <- function(...){
  .Call("morloc_send_fd", ...)
}
morloc_recv_fd <- function(...){
  .Call("morloc_recv_fd", ...)
}
morloc_kill <- function(...){
  .Call("morloc_kill", ...)
}
morloc_waitpid <- function(...){
  .Call("morloc_waitpid", ...)
}
morloc_install_sigterm_handler <- function(...){
  .Call("morloc_install_sigterm_handler", ...)
}
morloc_is_shutting_down <- function(...){
  .Call("morloc_is_shutting_down", ...)
}
morloc_waitpid_blocking <- function(...){
  .Call("morloc_waitpid_blocking", ...)
}
morloc_detach_daemon <- function(...){
  .Call("morloc_detach_daemon", ...)
}
morloc_shared_counter_create <- function(...){
  .Call("morloc_shared_counter_create", ...)
}
morloc_shared_counter_inc <- function(...){
  .Call("morloc_shared_counter_inc", ...)
}
morloc_shared_counter_dec <- function(...){
  .Call("morloc_shared_counter_dec", ...)
}
morloc_shared_counter_read <- function(...){
  .Call("morloc_shared_counter_read", ...)
}
morloc_pipe <- function(...){
  .Call("morloc_pipe", ...)
}
morloc_write_byte <- function(...){
  .Call("morloc_write_byte", ...)
}
morloc_close_fd <- function(...){
  .Call("morloc_close_fd", ...)
}
morloc_worker_loop_c <- function(...){
  .Call("morloc_worker_loop_c", ...)
}
morloc_set_line_buffered <- function(...){
  .Call("morloc_set_line_buffered", ...)
}
morloc_exit <- function(...){
  .Call("morloc_exit", ...)
}

# Mutable per-pool globals (tmpdir is set from the command line below)
global_state <- list()

# Dynamic worker spawning: monkey-patch morloc_foreign_call to track busy workers.
# Workers atomically increment a shared counter before a foreign_call and
# decrement after. When all workers are busy, a byte is written to a wake-up
# pipe to tell the dispatcher to spawn a new worker.
.orig_foreign_call <- morloc_foreign_call
.busy_counter <- NULL
.wakeup_fd <- NULL
.n_workers_total <- 0L

morloc_foreign_call <- function(...) {
  val <- morloc_shared_counter_inc(.busy_counter)
  if (val >= .n_workers_total && !is.null(.wakeup_fd)) {
    # Best-effort wake-up; a dead pipe must not fail the call itself
    tryCatch(morloc_write_byte(.wakeup_fd, as.raw(0x21)), error = function(e) NULL)
  }
  # on.exit guarantees the decrement even if the foreign call errors
  on.exit(morloc_shared_counter_dec(.busy_counter))
  .orig_foreign_call(...)
}

# AUTO include manifolds start
# <<>>
# AUTO include manifolds end

# AUTO include dispatch start
# <<>>
# AUTO include dispatch end

# Worker body: block in the C loop reading job fds and dispatching calls
worker_loop <- function(pipe_fd) {
  morloc_worker_loop_c(pipe_fd, .dispatch, .remote_dispatch)
}

main <- function(socket_path, tmpdir, shm_basename) {
  # Force line-buffered stdout/stderr so output from user functions is not lost
  # when the nexus kills the pool process group.
  morloc_set_line_buffered()
  morloc_install_sigterm_handler()

  daemon <- morloc_start_daemon(socket_path, tmpdir, shm_basename, 0xffff)

  n_workers <- 1L

  # Shared job queue: dispatcher writes fds to fd[1], workers read from fd[2].
  # Only idle workers (blocked in recvmsg) pick up jobs, preventing the
  # round-robin deadlock where a callback gets dispatched to a busy worker.
  job_queue <- morloc_socketpair()

  # Shared counter for dynamic worker spawning
  busy_counter <- morloc_shared_counter_create()
  wakeup <- morloc_pipe()  # c(read_fd, write_fd)

  # Set globals so the monkey-patched morloc_foreign_call can use them.
  # Forked children inherit these values.
  .busy_counter <<- busy_counter
  .wakeup_fd <<- wakeup[2L]
  .n_workers_total <<- n_workers

  pids <- integer(n_workers)
  for (i in seq_len(n_workers)) {
    pid <- morloc_fork()
    if (pid == 0L) {
      # Child: drop fds a worker must not hold, then serve jobs forever
      morloc_detach_daemon(daemon)
      morloc_close_socket(job_queue[1L])  # child doesn't write
      morloc_close_fd(wakeup[1L])  # child doesn't read wakeup pipe
      worker_loop(job_queue[2L])
      morloc_exit(0L)
    }
    pids[i] <- pid
  }

  # Keep job_queue[2L] open so dynamically spawned children can use it
  on.exit({
    tryCatch(morloc_close_socket(job_queue[1L]), error = function(e) NULL)
    tryCatch(morloc_close_socket(job_queue[2L]), error = function(e) NULL)
    tryCatch(morloc_close_fd(wakeup[1L]), error = function(e) NULL)
    tryCatch(morloc_close_fd(wakeup[2L]), error = function(e) NULL)
    for (pid in pids) {
      if (pid > 0L) {
        tryCatch(morloc_kill(pid, 9L), error = function(e) NULL)
        tryCatch(morloc_waitpid_blocking(pid), error = function(e) NULL)
      }
    }
  })

  # Dispatch loop - idle workers pull from shared queue.
  # After each dispatch cycle, check if all workers are busy and spawn more.
  while (!morloc_is_shutting_down()) {
    client_fd <- morloc_wait_for_client(daemon)
    if (client_fd > 0L) {
      tryCatch({
        morloc_send_fd(job_queue[1L], client_fd)
      }, error = function(e) {
        cat(paste("Failed to dispatch job:", e$message, "\n"), file = stderr())
      }, finally = {
        # The worker received its own duplicate of the fd; close ours
        morloc_close_socket(client_fd)
      })
    }
    # Dynamic worker spawning: if all workers are blocked in foreign_call,
    # spawn a new one so incoming callbacks can still be served.
    current_busy <- morloc_shared_counter_read(busy_counter)
    if (current_busy >= n_workers) {
      pid <- morloc_fork()
      if (pid == 0L) {
        morloc_detach_daemon(daemon)
        morloc_close_socket(job_queue[1L])
        morloc_close_fd(wakeup[1L])
        worker_loop(job_queue[2L])
        morloc_exit(0L)
      }
      pids <- c(pids, pid)
      n_workers <- n_workers + 1L
      .n_workers_total <<- n_workers
    }
  }
}

args <- commandArgs(trailingOnly = TRUE)

# Health check: confirm sources loaded and print version
if (length(args) == 1 && args[1] == "--health") {
  cat('{"status":"ok","version":"__MORLOC_VERSION__"}\n')
  quit(status = 0)
}

if (length(args) != 3) {
  cat("Usage: Rscript pool.R \n", file=stderr())
  quit(status = 1)
}

socket_path <- args[1]
tmpdir <- args[2]
shm_basename <- args[3]

global_state$tmpdir <- tmpdir

tryCatch(
  {
    main(socket_path, tmpdir, shm_basename)
  },
  error = function(e) {
    stop(paste("Pool failed:", e$message))
  })

# Use _exit to avoid R cleanup which triggers heap corruption on glibc >= 2.39
# (R's finalizers attempt to free objects in SHM-related C extensions)
morloc_exit(0L)


================================================ FILE: data/lang/r/rmorloc.c ================================================
// C bridge exposing the morloc runtime to R via .Call.
// NOTE(review): the system header names were stripped by extraction; the
// bare #include lines below are artifacts of that, not the real source.
#include
#include
#include
#include
#include
#include
#include
#include
#include
#include
#include
#include
#include
#include
#include
#include
#include "morloc.h"

// {{{ macros
// Declares the per-function error-message slot used by R_TRY.
#define MAYFAIL char* child_errmsg_ = NULL;

// Call a runtime function with an appended error out-parameter; on error,
// raise an R error (longjmp) with file/line/function context.
#define R_TRY(fun, ...) \
    fun(__VA_ARGS__ __VA_OPT__(,) &child_errmsg_); \
    if(child_errmsg_ != NULL){ \
        error("Error in R pool (%s:%d in %s):\n%s", __FILE__, __LINE__, __func__, child_errmsg_); \
    }

// Like R_TRY, but runs `clean` before raising so resources are released
// (error() does not return).
#define R_TRY_WITH(clean, fun, ...) \
    fun(__VA_ARGS__ __VA_OPT__(,) &child_errmsg_); \
    if(child_errmsg_ != NULL){ \
        clean; \
        error("Error in R pool (%s:%d in %s):\n%s", __FILE__, __LINE__, __func__, child_errmsg_); \
    }

// Raise an R error with file/line/function context and a printf-style message.
#define MORLOC_ERROR(msg, ...)
error("Error in R pool (%s:%d in %s):" msg, __FILE__, __LINE__, __func__, ##__VA_ARGS__); /// }}} // {{{ to_voidstar static size_t get_shm_size(const Schema* schema, SEXP obj) { size_t size = 0; switch (schema->type) { case MORLOC_NIL: case MORLOC_BOOL: case MORLOC_SINT8: case MORLOC_SINT16: case MORLOC_SINT32: case MORLOC_SINT64: case MORLOC_UINT8: case MORLOC_UINT16: case MORLOC_UINT32: case MORLOC_UINT64: case MORLOC_FLOAT32: case MORLOC_FLOAT64: return schema->width; case MORLOC_STRING: case MORLOC_ARRAY: { size_t length = (size_t)LENGTH(obj); size = sizeof(Array); // worst-case cursor alignment padding for element data size += schema_alignment(schema->parameters[0]) - 1; const char* str; switch (TYPEOF(obj)) { case CHARSXP: str = CHAR(obj); size += (size_t)strlen(str); // Do not include null terminator break; case STRSXP: if (LENGTH(obj) == 1) { str = CHAR(STRING_ELT(obj, 0)); size += (size_t)strlen(str); // Do not include null terminator } else { if(schema->parameters[0]->type == MORLOC_STRING){ for(size_t i = 0; i < length; i++){ size += get_shm_size(schema->parameters[0], STRING_ELT(obj, i)); } } else { MORLOC_ERROR("Expected character vector of length 1, but got length %zu", length); } } break; case VECSXP: // This handles lists for (int i = 0; i < length; i++) { size += get_shm_size(schema->parameters[0], VECTOR_ELT(obj, i)); } break; case LGLSXP: case INTSXP: case REALSXP: case RAWSXP: size += length * schema->parameters[0]->width; break; default: MORLOC_ERROR("Unsupported type in get_shm_size array: %s", type2char(TYPEOF(obj))); } return size; } case MORLOC_TUPLE: if (!isVectorList(obj)) { MORLOC_ERROR("Expected list for MORLOC_TUPLE, but got %s", type2char(TYPEOF(obj))); } { size_t array_size = (size_t)xlength(obj); if (array_size != schema->size) { MORLOC_ERROR("Expected tuple of length %zu, but found list of length %zu", schema->size, size); } size = schema->width; for (R_xlen_t i = 0; i < (R_xlen_t)array_size; ++i) { SEXP item = VECTOR_ELT(obj, i); 
size_t elem = get_shm_size(schema->parameters[i], item); if (elem > schema->parameters[i]->width) { size += elem - schema->parameters[i]->width; } } return size; } case MORLOC_MAP: { if (isNewList(obj)) { // Handle named list size = schema->width; SEXP names = getAttrib(obj, R_NamesSymbol); if (names == R_NilValue) { error("List must have names for MORLOC_MAP"); } for (size_t i = 0; i < schema->size; ++i) { SEXP key = PROTECT(mkChar(schema->keys[i])); int index = -1; for (int j = 0; j < length(obj); j++) { if (strcmp(CHAR(STRING_ELT(names, j)), CHAR(key)) == 0) { index = j; break; } } if (index != -1) { SEXP value = VECTOR_ELT(obj, index); size_t elem = get_shm_size(schema->parameters[i], value); if (elem > schema->parameters[i]->width) { size += elem - schema->parameters[i]->width; } } UNPROTECT(1); } return size; } else { error("Expected a named list for MORLOC_MAP"); } } case MORLOC_OPTIONAL: if (obj == R_NilValue) { return schema->width; } { size_t inner_size = get_shm_size(schema->parameters[0], obj); size = schema->width; if (inner_size > schema->parameters[0]->width) { size += inner_size - schema->parameters[0]->width; } return size; } case MORLOC_TENSOR: { size_t ndim = schema_tensor_ndim(schema); size_t elem_width = schema->parameters[0]->width; SEXP dim = getAttrib(obj, R_DimSymbol); size_t total = 1; if (dim != R_NilValue) { for (int i = 0; i < length(dim); i++) total *= (size_t)INTEGER(dim)[i]; } else { total = (size_t)XLENGTH(obj); } size = sizeof(Tensor); size += _Alignof(int64_t) - 1; size += ndim * sizeof(int64_t); size += schema_alignment(schema->parameters[0]) - 1; size += total * elem_width; return size; } default: MORLOC_ERROR("Unhandled schema type"); break; } return size; } #define HANDLE_SINT_TYPE(CTYPE, MIN, MAX) \ do { \ if (!(isInteger(obj) || isReal(obj))) { \ MORLOC_ERROR("Expected integer for %s, but got %s", #CTYPE, type2char(TYPEOF(obj))); \ } \ double value = asReal(obj); \ if (value < MIN || value > MAX) { \ MORLOC_ERROR("Integer 
overflow for %s", #CTYPE); \ } \ *(CTYPE*)dest = (CTYPE)value; \ } while(0) #define HANDLE_UINT_TYPE(CTYPE, MAX) \ do { \ if (!(isInteger(obj) || isReal(obj))) { \ MORLOC_ERROR("Expected integer for %s, but got %s", #CTYPE, type2char(TYPEOF(obj))); \ } \ double value = asReal(obj); \ if (value < 0 || value > MAX) { \ MORLOC_ERROR("Integer overflow for %s", #CTYPE); \ } \ *(CTYPE*)dest = (CTYPE)value; \ } while(0) static void* to_voidstar_r(void* dest, void** cursor, SEXP obj, const Schema* schema){ MAYFAIL switch (schema->type) { case MORLOC_NIL: if (obj != R_NilValue) { MORLOC_ERROR("Expected NULL for MORLOC_NIL, but got %s", type2char(TYPEOF(obj))); } *((int8_t*)dest) = (int8_t)0; break; case MORLOC_BOOL: if (!isLogical(obj)) { MORLOC_ERROR("Expected logical for MORLOC_BOOL, but got %s", type2char(TYPEOF(obj))); } *((uint8_t*)dest) = (uint8_t)((LOGICAL(obj)[0] == TRUE) ? 1 : 0); break; case MORLOC_SINT8: HANDLE_SINT_TYPE(int8_t, INT8_MIN, INT8_MAX); break; case MORLOC_SINT16: HANDLE_SINT_TYPE(int16_t, INT16_MIN, INT16_MAX); break; case MORLOC_SINT32: HANDLE_SINT_TYPE(int32_t, INT32_MIN, INT32_MAX); break; case MORLOC_SINT64: HANDLE_SINT_TYPE(int64_t, INT64_MIN, INT64_MAX); break; case MORLOC_UINT8: HANDLE_UINT_TYPE(uint8_t, UINT8_MAX); break; case MORLOC_UINT16: HANDLE_UINT_TYPE(uint16_t, UINT16_MAX); break; case MORLOC_UINT32: HANDLE_UINT_TYPE(uint32_t, UINT32_MAX); break; case MORLOC_UINT64: HANDLE_UINT_TYPE(uint64_t, UINT64_MAX); break; case MORLOC_FLOAT32: if (!(isReal(obj) || isInteger(obj))) { MORLOC_ERROR("Expected numeric for MORLOC_FLOAT32, but got %s", type2char(TYPEOF(obj))); } *((float*)dest) = (float)asReal(obj); break; case MORLOC_FLOAT64: if (!(isReal(obj) || isInteger(obj))) { MORLOC_ERROR("Expected numeric for MORLOC_FLOAT64, but got %s", type2char(TYPEOF(obj))); } *((double*)dest) = asReal(obj); break; case MORLOC_STRING: { const char* str = NULL; size_t length = 0; switch(TYPEOF(obj)){ case CHARSXP: str = CHAR(obj); length = 
(size_t)strlen(str);
            break;
        case STRSXP:
            if (LENGTH(obj) == 1) {
                str = CHAR(STRING_ELT(obj, 0));
                length = (size_t)strlen(str);
            } else {
                MORLOC_ERROR("Expected character of length 1");
            }
            break;
        case RAWSXP:
            str = RAW(obj);
            length = LENGTH(obj);
            break;
        default:
            MORLOC_ERROR("Expected a character type");
            break;
        }
        Array* array = (Array*)dest;
        array->size = length; // Do not include null terminator
        if(length > 0){
            // align cursor for element data placement
            *cursor = (void*)ALIGN_UP((uintptr_t)*cursor, schema_alignment(schema->parameters[0]));
            array->data = R_TRY(abs2rel, *cursor);
            absptr_t tmp_ptr = R_TRY(rel2abs, array->data);
            memcpy(tmp_ptr, str, array->size);
        } else {
            array->data = RELNULL;
        }
        // move cursor to the location after the copied data
        *cursor = (void*)(*(char**)cursor + array->size);
    }
    break;
    case MORLOC_ARRAY:
        // NOTE(review): declarations directly after a case label with no
        // enclosing braces -- relies on C23/GNU acceptance; confirm the
        // build's C standard if this is ported
        Array* array = (Array*)dest;
        array->size = (size_t)length(obj);
        if(array->size == 0){
            array->data = RELNULL;
            break;
        }
        // align cursor for element data placement
        *cursor = (void*)ALIGN_UP((uintptr_t)*cursor, schema_alignment(schema->parameters[0]));
        array->data = R_TRY(abs2rel, *cursor);
        Schema* element_schema = schema->parameters[0];
        char* start;
        switch (TYPEOF(obj)) {
        case STRSXP: {
            if(element_schema->type == MORLOC_STRING){
                // set the cursor to the location after the array headers
                *cursor = (void*)(*(char**)cursor + array->size * element_schema->width);
                start = R_TRY(rel2abs, array->data);
                for(size_t i = 0; i < array->size; i++){
                    SEXP elem = STRING_ELT(obj, i);
                    to_voidstar_r(start + i * element_schema->width, cursor, elem, element_schema);
                }
            } else {
                MORLOC_ERROR("Expected character vector of length 1, but got length %ld", array->size);
            }
        }
        break;
        case RAWSXP:
            // Raw vectors
            if (element_schema->type != MORLOC_UINT8) {
                MORLOC_ERROR("Expected MORLOC_UINT8 for raw vector");
            }
            absptr_t tmp_ptr = R_TRY(rel2abs, array->data);
            memcpy(tmp_ptr, RAW(obj), array->size * sizeof(uint8_t));
            *cursor = (void*)(*(char**)cursor + array->size * sizeof(uint8_t));
            break;
        case VECSXP:
            // This handles lists
            *cursor = (void*)(*(char**)cursor + array->size * element_schema->width);
            start = R_TRY(rel2abs, array->data);
            for (int i = 0; i < array->size; i++) {
                SEXP elem = VECTOR_ELT(obj, i);
                to_voidstar_r(start + i * element_schema->width, cursor, elem, element_schema);
            }
            break;
        case LGLSXP:
            // Box each logical element as a scalar SEXP and recurse
            *cursor = (void*)(*(char**)cursor + array->size * element_schema->width);
            start = R_TRY(rel2abs, array->data);
            for (int i = 0; i < array->size; i++) {
                SEXP elem = PROTECT(ScalarLogical(LOGICAL(obj)[i]));
                to_voidstar_r(start + i * element_schema->width, cursor, elem, element_schema);
                UNPROTECT(1);
            }
            break;
        case INTSXP:
            *cursor = (void*)(*(char**)cursor + array->size * element_schema->width);
            start = R_TRY(rel2abs, array->data);
            for (int i = 0; i < array->size; i++) {
                SEXP elem = PROTECT(ScalarInteger(INTEGER(obj)[i]));
                to_voidstar_r(start + i * element_schema->width, cursor, elem, element_schema);
                UNPROTECT(1);
            }
            break;
        case REALSXP:
            *cursor = (void*)(*(char**)cursor + array->size * element_schema->width);
            start = R_TRY(rel2abs, array->data);
            for (int i = 0; i < array->size; i++) {
                SEXP elem = PROTECT(ScalarReal(REAL(obj)[i]));
                to_voidstar_r(start + i * element_schema->width, cursor, elem, element_schema);
                UNPROTECT(1);
            }
            break;
        default:
            MORLOC_ERROR("Unsupported type in to_voidstar array: %s", type2char(TYPEOF(obj)));
        }
        break;
    case MORLOC_TUPLE:
        if (!isVectorList(obj)) {
            MORLOC_ERROR("Expected list for MORLOC_TUPLE, but got %s", type2char(TYPEOF(obj)));
        }
        {
            R_xlen_t size = xlength(obj);
            if ((size_t)size != schema->size) {
                MORLOC_ERROR("Expected tuple of length %zu, but found list of length %zu", schema->size, size);
            }
            // Each tuple slot goes at its precomputed offset within dest
            for (R_xlen_t i = 0; i < size; ++i) {
                SEXP item = VECTOR_ELT(obj, i);
                to_voidstar_r(dest + schema->offsets[i], cursor, item, schema->parameters[i]);
            }
        }
        break;
    case MORLOC_MAP: {
        if (isNewList(obj)) {
            // Handle named list
            SEXP names = getAttrib(obj, R_NamesSymbol);
            if (names == R_NilValue) {
                MORLOC_ERROR("List must have names for MORLOC_MAP");
            }
            // Match each schema key against the list names (missing keys are
            // silently skipped, leaving their slot unwritten)
            for (size_t i = 0; i < schema->size; ++i) {
                SEXP key = PROTECT(mkChar(schema->keys[i]));
                int index = -1;
                for (int j = 0; j < length(obj); j++) {
                    if (strcmp(CHAR(STRING_ELT(names, j)), CHAR(key)) == 0) {
                        index = j;
                        break;
                    }
                }
                if (index != -1) {
                    SEXP value = VECTOR_ELT(obj, index);
                    to_voidstar_r(dest + schema->offsets[i], cursor, value, schema->parameters[i]);
                }
                UNPROTECT(1); // key
            }
        } else {
            MORLOC_ERROR("Expected a named list for MORLOC_MAP");
        }
    }
    break;
    case MORLOC_OPTIONAL:
        // Tag byte (0 = absent, 1 = present) followed by the payload slot
        if (obj == R_NilValue) {
            *((uint8_t*)dest) = 0;
            memset((char*)dest + schema->offsets[0], 0, schema->parameters[0]->width);
        } else {
            *((uint8_t*)dest) = 1;
            to_voidstar_r((char*)dest + schema->offsets[0], cursor, obj, schema->parameters[0]);
        }
        break;
    case MORLOC_TENSOR: {
        size_t ndim = schema_tensor_ndim(schema);
        size_t elem_width = schema->parameters[0]->width;
        // Get shape from dim attribute (or length for 1D)
        SEXP dim = getAttrib(obj, R_DimSymbol);
        int64_t shape[5];
        size_t total = 1;
        if (dim != R_NilValue) {
            for (size_t i = 0; i < ndim; i++) {
                shape[i] = (int64_t)INTEGER(dim)[i];
                total *= (size_t)shape[i];
            }
        } else {
            shape[0] = (int64_t)XLENGTH(obj);
            total = (size_t)shape[0];
        }
        Tensor* tensor = (Tensor*)dest;
        tensor->total_elements = total;
        tensor->device_type = 0;
        tensor->device_id = 0;
        if (total == 0) {
            tensor->shape = RELNULL;
            tensor->data = RELNULL;
            break;
        }
        // Write shape
        *cursor = (void*)ALIGN_UP((uintptr_t)*cursor, _Alignof(int64_t));
        tensor->shape = R_TRY(abs2rel, (absptr_t)*cursor);
        int64_t* shape_dst = (int64_t*)*cursor;
        for (size_t i = 0; i < ndim; i++) shape_dst[i] = shape[i];
        *cursor = (char*)*cursor + ndim * sizeof(int64_t);
        // Write data: transpose from column-major (R) to row-major (C)
        size_t data_align = schema_alignment(schema->parameters[0]);
        *cursor = (void*)ALIGN_UP((uintptr_t)*cursor, data_align);
        tensor->data = R_TRY(abs2rel, (absptr_t)*cursor);
        // Coerce R object to match schema element type
        SEXP coerced = obj;
        int need_protect = 0;
        morloc_serial_type etype =
schema->parameters[0]->type;
        // Float schemas get a REALSXP source; other non-bool schemas an INTSXP
        if ((etype == MORLOC_FLOAT64 || etype == MORLOC_FLOAT32) && !isReal(obj)) {
            coerced = PROTECT(coerceVector(obj, REALSXP));
            need_protect = 1;
        } else if (etype != MORLOC_FLOAT64 && etype != MORLOC_FLOAT32 && etype != MORLOC_BOOL && !isInteger(obj)) {
            coerced = PROTECT(coerceVector(obj, INTSXP));
            need_protect = 1;
        }
        if (ndim == 1) {
            // 1D: no transpose needed
            if (isReal(coerced)) {
                memcpy(*cursor, REAL(coerced), total * elem_width);
            } else if (isInteger(coerced)) {
                memcpy(*cursor, INTEGER(coerced), total * elem_width);
            } else if (isLogical(coerced)) {
                int* src = LOGICAL(coerced);
                uint8_t* dst = (uint8_t*)*cursor;
                for (size_t i = 0; i < total; i++) dst[i] = (uint8_t)(src[i] != 0);
            }
        } else if (ndim == 2) {
            // 2D: column-major (R) -> row-major (C) transpose
            size_t nrows = (size_t)shape[0];
            size_t ncols = (size_t)shape[1];
            if (isReal(coerced)) {
                double* src = REAL(coerced);
                double* dst = (double*)*cursor;
                for (size_t r = 0; r < nrows; r++)
                    for (size_t c = 0; c < ncols; c++)
                        dst[r * ncols + c] = src[c * nrows + r];
            } else if (isInteger(coerced)) {
                int* src = INTEGER(coerced);
                int* dst = (int*)*cursor;
                for (size_t r = 0; r < nrows; r++)
                    for (size_t c = 0; c < ncols; c++)
                        dst[r * ncols + c] = src[c * nrows + r];
            }
        } else {
            // General N-D: map each row-major index to its column-major source
            size_t col_strides[5];
            col_strides[0] = 1;
            for (size_t d = 1; d < ndim; d++) col_strides[d] = col_strides[d-1] * (size_t)shape[d-1];
            size_t row_strides[5];
            row_strides[ndim-1] = 1;
            for (size_t d = ndim-1; d > 0; d--) row_strides[d-1] = row_strides[d] * (size_t)shape[d];
            if (isReal(coerced)) {
                double* src = REAL(coerced);
                double* dst = (double*)*cursor;
                for (size_t i = 0; i < total; i++) {
                    size_t rem = i;
                    size_t col_idx = 0;
                    for (size_t d = 0; d < ndim; d++) {
                        size_t coord = rem / row_strides[d];
                        rem %= row_strides[d];
                        col_idx += coord * col_strides[d];
                    }
                    dst[i] = src[col_idx];
                }
            } else if (isInteger(coerced)) {
                int* src = INTEGER(coerced);
                int* dst = (int*)*cursor;
                for (size_t i = 0; i < total; i++) {
                    size_t rem = i;
                    size_t col_idx = 0;
                    for (size_t d = 0; d < ndim; d++) {
                        size_t coord = rem / row_strides[d];
                        rem %= row_strides[d];
                        col_idx += coord * col_strides[d];
                    }
                    dst[i] = src[col_idx];
                }
            }
        }
        if (need_protect) UNPROTECT(1);
        *cursor = (char*)*cursor + total * elem_width;
    }
    break;
    default:
        MORLOC_ERROR("Unhandled schema type");
        break;
    }
    return dest;
}

// NOTE: If to_voidstar_r calls error() (via MORLOC_ERROR or R_TRY), the shared
// memory at dest leaks. This only happens on type mismatches (a development-time
// bug) and the memory is reclaimed when the pool process exits.

// Top-level entry: size the object, allocate shared memory, and serialize.
// The variable-length cursor starts just past the fixed-width header region.
static void* to_voidstar(SEXP obj, const Schema* schema) { MAYFAIL
    size_t total_size = get_shm_size(schema, obj);
    void* dest = R_TRY(shmalloc, total_size);
    void* cursor = (void*)((char*)dest + schema->width);
    return to_voidstar_r(dest, &cursor, obj, schema);
}

// }}} to_voidstar

// {{{ from_voidstar

// Reconstruct an R object from voidstar data laid out per `schema`.
// `base_ptr` is the base used to resolve relative pointers (NULL means the
// default shared-memory resolution inside resolve_relptr).
static SEXP from_voidstar(const void* data, const Schema* schema, const void* base_ptr) { MAYFAIL
    if(data == NULL){
        MORLOC_ERROR("NULL data (%s:%d in %s)", __FILE__, __LINE__, __func__);
    }
    if(schema == NULL){
        MORLOC_ERROR("NULL schema (%s:%d in %s)", __FILE__, __LINE__, __func__);
    }
    SEXP obj = R_NilValue;
    switch (schema->type) {
    case MORLOC_NIL:
        return R_NilValue;
    case MORLOC_BOOL:
        obj = ScalarLogical((bool)*(uint8_t*)data);
        break;
    case MORLOC_SINT8:
        obj = ScalarInteger((int)(*(int8_t*)data));
        break;
    case MORLOC_SINT16:
        obj = ScalarInteger((int)(*(int16_t*)data));
        break;
    case MORLOC_SINT32:
        obj = ScalarInteger(*(int32_t*)data);
        break;
    case MORLOC_SINT64:
        // R integers are 32-bit, so wide integers come back as doubles
        obj = ScalarReal((double)(*(int64_t*)data));
        break;
    case MORLOC_UINT8:
        obj = ScalarInteger((int)(*(uint8_t*)data));
        break;
    case MORLOC_UINT16:
        obj = ScalarInteger((int)(*(uint16_t*)data));
        break;
    case MORLOC_UINT32:
        obj = ScalarReal((double)(*(uint32_t*)data));
        break;
    case MORLOC_UINT64:
        obj = ScalarReal((double)(*(uint64_t*)data));
        break;
    case MORLOC_FLOAT32:
        obj = ScalarReal((double)(*(float*)data));
        break;
    case MORLOC_FLOAT64:
        obj = ScalarReal(*(double*)data);
        break;
    case MORLOC_STRING: {
        if (schema->hint != NULL
&& strcmp(schema->hint, "raw") == 0){
            // "raw" hint: decode the byte array as an R raw vector
            Array* raw_array = (Array*)data;
            if(raw_array->size > 0){
                void* tmp_ptr = R_TRY(resolve_relptr, raw_array->data, base_ptr);
                obj = PROTECT(allocVector(RAWSXP, raw_array->size));
                memcpy(RAW(obj), tmp_ptr, raw_array->size);
            } else {
                obj = PROTECT(allocVector(RAWSXP, 0));
            }
            UNPROTECT(1);
        } else {
            // Default: decode as a length-1 character vector
            Array* str_array = (Array*)data;
            if(str_array->size > 0){
                void* tmp_ptr = R_TRY(resolve_relptr, str_array->data, base_ptr);
                SEXP chr = PROTECT(mkCharLen(tmp_ptr, str_array->size));
                obj = PROTECT(ScalarString(chr));
            } else {
                SEXP chr = PROTECT(mkChar(""));
                obj = PROTECT(ScalarString(chr));
            }
            UNPROTECT(2);
        }
    }
    break;
    case MORLOC_ARRAY: {
        Array* array = (Array*)data;
        Schema* element_schema = schema->parameters[0];
        char* start;
        // Dispatch on the element type to build the natural R vector type
        switch(element_schema->type){
        case MORLOC_BOOL:
            obj = PROTECT(allocVector(LGLSXP, array->size));
            if(array->size == 0) { UNPROTECT(1); break; }
            start = (char*)R_TRY(resolve_relptr, array->data, base_ptr);
            for (size_t i = 0; i < array->size; i++) {
                LOGICAL(obj)[i] = (bool)*(uint8_t*)(start + i) ? TRUE : FALSE;
            }
            UNPROTECT(1);
            break;
        case MORLOC_SINT8:
            obj = PROTECT(allocVector(INTSXP, array->size));
            if(array->size == 0) { UNPROTECT(1); break; }
            start = (char*)R_TRY(resolve_relptr, array->data, base_ptr);
            for (size_t i = 0; i < array->size; i++) {
                INTEGER(obj)[i] = (int)(*(int8_t*)(start + i * sizeof(int8_t)));
            }
            UNPROTECT(1);
            break;
        case MORLOC_SINT16:
            obj = PROTECT(allocVector(INTSXP, array->size));
            if(array->size == 0) { UNPROTECT(1); break; }
            start = (char*)R_TRY(resolve_relptr, array->data, base_ptr);
            for (size_t i = 0; i < array->size; i++) {
                INTEGER(obj)[i] = (int)(*(int16_t*)(start + i * sizeof(int16_t)));
            }
            UNPROTECT(1);
            break;
        case MORLOC_SINT32:
            // Same width as R's int, so a straight memcpy is possible
            obj = PROTECT(allocVector(INTSXP, array->size));
            if(array->size == 0) { UNPROTECT(1); break; }
            {
                void* tmp_ptr = R_TRY(resolve_relptr, array->data, base_ptr);
                memcpy(INTEGER(obj), tmp_ptr, array->size * sizeof(int32_t));
            }
            UNPROTECT(1);
            break;
        case MORLOC_SINT64:
            obj = PROTECT(allocVector(REALSXP, array->size));
            if(array->size == 0) { UNPROTECT(1); break; }
            start = (char*)R_TRY(resolve_relptr, array->data, base_ptr);
            for (size_t i = 0; i < array->size; i++) {
                REAL(obj)[i] = (double)(*(int64_t*)(start + i * sizeof(int64_t)));
            }
            UNPROTECT(1);
            break;
        // Interpret the uint8 as a raw vector
        case MORLOC_UINT8:
            obj = PROTECT(allocVector(RAWSXP, array->size));
            if(array->size == 0) { UNPROTECT(1); break; }
            start = (char*)R_TRY(resolve_relptr, array->data, base_ptr);
            memcpy(RAW(obj), start, array->size * sizeof(uint8_t));
            UNPROTECT(1);
            break;
        case MORLOC_UINT16:
            obj = PROTECT(allocVector(INTSXP, array->size));
            if(array->size == 0) { UNPROTECT(1); break; }
            start = (char*)R_TRY(resolve_relptr, array->data, base_ptr);
            for (size_t i = 0; i < array->size; i++) {
                INTEGER(obj)[i] = (int)(*(uint16_t*)(start + i * sizeof(uint16_t)));
            }
            UNPROTECT(1);
            break;
        case MORLOC_UINT32:
            obj = PROTECT(allocVector(REALSXP, array->size));
            if(array->size == 0) { UNPROTECT(1); break; }
            start = (char*)R_TRY(resolve_relptr, array->data, base_ptr);
            for (size_t i = 0; i < array->size; i++) {
                REAL(obj)[i] = (double)(*(uint32_t*)(start + i * sizeof(uint32_t)));
            }
            UNPROTECT(1);
            break;
        case MORLOC_UINT64:
            // NOTE: the R integer cannot store a 64 bit int
            obj = PROTECT(allocVector(REALSXP, array->size));
            if(array->size == 0) { UNPROTECT(1); break; }
            start = (char*)R_TRY(resolve_relptr, array->data, base_ptr);
            for (size_t i = 0; i < array->size; i++) {
                REAL(obj)[i] = (double)(*(uint64_t*)(start + i * sizeof(uint64_t)));
            }
            UNPROTECT(1);
            break;
        case MORLOC_FLOAT32:
            obj = PROTECT(allocVector(REALSXP, array->size));
            if(array->size == 0) { UNPROTECT(1); break; }
            start = (char*)R_TRY(resolve_relptr, array->data, base_ptr);
            for (size_t i = 0; i < array->size; i++) {
                REAL(obj)[i] = (double)(*(float*)(start + i * sizeof(float)));
            }
            UNPROTECT(1);
            break;
        case MORLOC_FLOAT64:
            obj = PROTECT(allocVector(REALSXP, array->size));
            if(array->size == 0) { UNPROTECT(1); break; }
            start = (char*)R_TRY(resolve_relptr, array->data, base_ptr);
            memcpy(REAL(obj), start, array->size * sizeof(double));
            UNPROTECT(1);
            break;
        case MORLOC_STRING: {
            obj = PROTECT(allocVector(STRSXP, array->size));
            if(array->size == 0) { UNPROTECT(1); break; }
            start = (char*)R_TRY(resolve_relptr, array->data, base_ptr);
            // NOTE(review): stride is the outer schema's width here, not
            // element_schema->width -- confirm this matches the writer layout
            size_t width = schema->width;
            for (size_t i = 0; i < array->size; i++) {
                Array* str_array = (Array*)(start + i * width);
                SEXP item;
                if(str_array->size == 0){
                    item = PROTECT(mkCharLen("", 0));
                } else {
                    void* str_ptr = R_TRY_WITH(UNPROTECT(1), resolve_relptr, str_array->data, base_ptr);
                    item = PROTECT(mkCharLen(str_ptr, str_array->size));
                }
                UNPROTECT(1);
                SET_STRING_ELT(obj, i, item);
            }
            UNPROTECT(1);
        }
        break;
        default: {
            // Compound elements become elements of an R list
            obj = PROTECT(allocVector(VECSXP, array->size));
            if(array->size == 0) { UNPROTECT(1); break; }
            start = (char*)R_TRY(resolve_relptr, array->data, base_ptr);
            size_t width = element_schema->width;
            for (size_t i = 0; i < array->size; i++) {
                SEXP item = from_voidstar(start + width * i, element_schema, base_ptr);
                if (item ==
R_NilValue) {
                    UNPROTECT(1);
                    obj = R_NilValue;
                    goto error;
                }
                SET_VECTOR_ELT(obj, i, item);
            }
            UNPROTECT(1);
        }
        break;
        }
    }
    break;
    case MORLOC_TUPLE: {
        // Tuples come back as unnamed R lists, one slot per field offset
        obj = PROTECT(allocVector(VECSXP, schema->size));
        for (size_t i = 0; i < schema->size; i++) {
            void* item_ptr = (char*)data + schema->offsets[i];
            SEXP item = from_voidstar(item_ptr, schema->parameters[i], base_ptr);
            if (item == R_NilValue) {
                UNPROTECT(1);
                obj = R_NilValue;
                goto error;
            }
            SET_VECTOR_ELT(obj, i, item);
        }
        UNPROTECT(1);
        break;
    }
    case MORLOC_MAP: {
        // Maps come back as named R lists using the schema's key order
        obj = PROTECT(allocVector(VECSXP, schema->size));
        SEXP names = PROTECT(allocVector(STRSXP, schema->size));
        for (size_t i = 0; i < schema->size; i++) {
            void* item_ptr = (char*)data + schema->offsets[i];
            SEXP value = from_voidstar(item_ptr, schema->parameters[i], base_ptr);
            if (value == R_NilValue) {
                UNPROTECT(2);
                obj = R_NilValue;
                goto error;
            }
            SET_VECTOR_ELT(obj, i, value);
            SET_STRING_ELT(names, i, mkChar(schema->keys[i]));
        }
        setAttrib(obj, R_NamesSymbol, names);
        UNPROTECT(2);
        break;
    }
    case MORLOC_OPTIONAL: {
        // Leading tag byte: 0 = absent (NULL), nonzero = payload follows
        uint8_t tag = *(const uint8_t*)data;
        if (tag == 0) { return R_NilValue; }
        obj = from_voidstar((const char*)data + schema->offsets[0], schema->parameters[0], base_ptr);
        break;
    }
    case MORLOC_TENSOR: {
        const Tensor* tensor = (const Tensor*)data;
        size_t ndim = schema_tensor_ndim(schema);
        size_t total = tensor->total_elements;
        if (total == 0) {
            // NOTE(review): obj is still R_NilValue at this point, so
            // isReal(obj) is always FALSE and empty tensors always come back
            // as INTSXP, even for float schemas -- confirm intended
            if (isReal(obj)) {
                obj = PROTECT(allocVector(REALSXP, 0));
            } else {
                obj = PROTECT(allocVector(INTSXP, 0));
            }
            UNPROTECT(1);
            break;
        }
        const int64_t* shape = (const int64_t*)resolve_relptr(tensor->shape, base_ptr, NULL);
        const void* tdata = resolve_relptr(tensor->data, base_ptr, NULL);
        // Allocate R vector
        int sexptype;
        switch (schema->parameters[0]->type) {
        case MORLOC_FLOAT32:
        case MORLOC_FLOAT64:
            sexptype = REALSXP;
            break;
        case MORLOC_BOOL:
            sexptype = LGLSXP;
            break;
        default:
            sexptype = INTSXP;
            break;
        }
        obj = PROTECT(allocVector(sexptype, (R_xlen_t)total));
        if (ndim == 1) {
            // 1D: no transpose
            if (sexptype == REALSXP) {
                if (schema->parameters[0]->type == MORLOC_FLOAT32) {
                    const float* src = (const float*)tdata;
                    double* dst = REAL(obj);
                    for (size_t i = 0; i < total; i++) dst[i] = (double)src[i];
                } else {
                    memcpy(REAL(obj), tdata, total * sizeof(double));
                }
            } else if (sexptype == INTSXP) {
                size_t elem_w = schema->parameters[0]->width;
                if (elem_w == sizeof(int)) {
                    memcpy(INTEGER(obj), tdata, total * sizeof(int));
                } else {
                    // Widen or narrow to int
                    int* dst = INTEGER(obj);
                    const char* src = (const char*)tdata;
                    for (size_t i = 0; i < total; i++) {
                        int64_t v = 0;
                        memcpy(&v, src + i * elem_w, elem_w);
                        dst[i] = (int)v;
                    }
                }
            } else if (sexptype == LGLSXP) {
                const uint8_t* src = (const uint8_t*)tdata;
                int* dst = LOGICAL(obj);
                for (size_t i = 0; i < total; i++) dst[i] = src[i] ? 1 : 0;
            }
        } else if (ndim == 2) {
            // 2D: row-major to col-major transpose
            size_t nrows = (size_t)shape[0];
            size_t ncols = (size_t)shape[1];
            if (sexptype == REALSXP) {
                const double* src = (const double*)tdata;
                double* dst = REAL(obj);
                for (size_t r = 0; r < nrows; r++)
                    for (size_t c = 0; c < ncols; c++)
                        dst[c * nrows + r] = src[r * ncols + c];
            } else if (sexptype == INTSXP) {
                const int* src = (const int*)tdata;
                int* dst = INTEGER(obj);
                for (size_t r = 0; r < nrows; r++)
                    for (size_t c = 0; c < ncols; c++)
                        dst[c * nrows + r] = src[r * ncols + c];
            }
        } else {
            // General N-D: row-major to col-major
            size_t col_strides[5];
            col_strides[0] = 1;
            for (size_t d = 1; d < ndim; d++) col_strides[d] = col_strides[d-1] * (size_t)shape[d-1];
            size_t row_strides[5];
            row_strides[ndim-1] = 1;
            for (size_t d = ndim-1; d > 0; d--) row_strides[d-1] = row_strides[d] * (size_t)shape[d];
            if (sexptype == REALSXP) {
                const double* src = (const double*)tdata;
                double* dst = REAL(obj);
                for (size_t i = 0; i < total; i++) {
                    // i is row-major index, compute col-major index
                    size_t rem = i;
                    size_t col_idx = 0;
                    for (size_t d = 0; d < ndim; d++) {
                        size_t coord = rem / row_strides[d];
                        rem %= row_strides[d];
                        col_idx += coord * col_strides[d];
                    }
                    dst[col_idx] = src[i];
}
            } else if (sexptype == INTSXP) {
                const int* src = (const int*)tdata;
                int* dst = INTEGER(obj);
                for (size_t i = 0; i < total; i++) {
                    size_t rem = i;
                    size_t col_idx = 0;
                    for (size_t d = 0; d < ndim; d++) {
                        size_t coord = rem / row_strides[d];
                        rem %= row_strides[d];
                        col_idx += coord * col_strides[d];
                    }
                    dst[col_idx] = src[i];
                }
            }
        }
        // Set dim attribute
        SEXP r_dim = PROTECT(allocVector(INTSXP, (R_xlen_t)ndim));
        for (size_t i = 0; i < ndim; i++) INTEGER(r_dim)[i] = (int)shape[i];
        setAttrib(obj, R_DimSymbol, r_dim);
        UNPROTECT(2); // obj, r_dim
        break;
    }
    default:
        MORLOC_ERROR("Unsupported schema type");
        goto error;
    }
    return obj;
error:
    return R_NilValue;
}

// }}} from_voidstar

// {{{ exported morloc API functions

// PID of the process that created the daemon (set in morloc_start_daemon)
static pid_t daemon_creator_pid = 0;

// Close the daemon when the R object dies
static void daemon_finalizer(SEXP ptr) {
    if (!R_ExternalPtrAddr(ptr)) return;
    // Skip cleanup in forked children -- they must not unlink the socket file
    if (daemon_creator_pid != 0 && getpid() != daemon_creator_pid) {
        R_ClearExternalPtr(ptr);
        return;
    }
    language_daemon_t* daemon = (language_daemon_t*)R_ExternalPtrAddr(ptr);
    if(daemon != NULL){
        close_daemon(&daemon);
    }
    R_ClearExternalPtr(ptr);
}

// Release daemon resources in a forked child WITHOUT unlinking the socket file.
// Workers call this after fork so they don't hold the server_fd or accidentally
// destroy the socket when they exit.
SEXP morloc_detach_daemon(SEXP daemon_r) {
    if (!R_ExternalPtrAddr(daemon_r)) return R_NilValue;
    language_daemon_t* daemon = (language_daemon_t*)R_ExternalPtrAddr(daemon_r);
    if (daemon != NULL) {
        close_socket(daemon->server_fd);
        // Close and free every queued client connection
        client_list_t *current = daemon->client_fds;
        while (current) {
            client_list_t *next = current->next;
            close(current->fd);
            free(current);
            current = next;
        }
        free(daemon->socket_path);
        free(daemon->tmpdir);
        free(daemon->shm_basename);
        free(daemon);
    }
    R_ClearExternalPtr(daemon_r);
    return R_NilValue;
}

// Start a language daemon and return it to R as a finalized external pointer
// of class "language_daemon".
SEXP morloc_start_daemon(
    SEXP socket_path_r,
    SEXP tmpdir_r,
    SEXP shm_basename_r,
    SEXP shm_default_size_r
){ MAYFAIL
    const char* socket_path = CHAR(STRING_ELT(socket_path_r, 0));
    const char* tmpdir = CHAR(STRING_ELT(tmpdir_r, 0));
    const char* shm_basename = CHAR(STRING_ELT(shm_basename_r, 0));
    size_t shm_default_size = (size_t)asInteger(shm_default_size_r);
    language_daemon_t* daemon = R_TRY(
        start_daemon,
        socket_path,
        tmpdir,
        shm_basename,
        shm_default_size
    );
    // Wrap pointer in external pointer
    SEXP result = PROTECT(R_MakeExternalPtr(daemon, R_NilValue, R_NilValue));
    // Record which process owns the daemon (for the PID guard in daemon_finalizer)
    daemon_creator_pid = getpid();
    // Register finalizer with wrapper
    R_RegisterCFinalizerEx(result, daemon_finalizer, TRUE);
    // Set class attribute
    SEXP class_name = PROTECT(mkString("language_daemon"));
    SET_CLASS(result, class_name);
    UNPROTECT(2);
    return result;
}

// Initialize a shared-memory volume from R
SEXP morloc_shinit(SEXP shm_basename_r, SEXP volume_index_r, SEXP shm_size_r) { MAYFAIL
    const char* shm_basename = CHAR(STRING_ELT(shm_basename_r, 0));
    size_t volume_index = (size_t)asInteger(volume_index_r);
    size_t shm_size = (size_t)asInteger(shm_size_r);
    R_TRY(shinit, shm_basename, volume_index, shm_size);
    return R_NilValue;
}

// {{{ signal handling for graceful shutdown

static volatile sig_atomic_t r_shutting_down = 0;

static void r_sigterm_handler(int sig) {
    (void)sig;
    r_shutting_down = 1;
}

// Install the SIGTERM handler that flips r_shutting_down
SEXP morloc_install_sigterm_handler(void) {
    struct sigaction sa;
    sa.sa_handler = r_sigterm_handler;
    sigemptyset(&sa.sa_mask);
    sa.sa_flags = 0;
    sigaction(SIGTERM, &sa, NULL);
    return R_NilValue;
}

// Query the shutdown flag from R
SEXP morloc_is_shutting_down(void) {
    return ScalarLogical(r_shutting_down != 0);
}

SEXP morloc_set_line_buffered(void) {
    // Only stderr - stdout is left fully buffered for performance
    // and flushed explicitly after each job.
    setvbuf(stderr, NULL, _IOLBF, 0);
    return R_NilValue;
}

// }}} signal handling

// Wait (up to 100ms) for a client connection or data. Returns -1 on shutdown,
// 0 on timeout/no client, or a ready client fd.
SEXP morloc_wait_for_client(SEXP daemon_r){ MAYFAIL
    if (!R_ExternalPtrAddr(daemon_r)) {
        MORLOC_ERROR("Expected a daemon pointer");
    }
    // Return immediately if shutdown was requested
    if (r_shutting_down) {
        return ScalarInteger(-1);
    }
    language_daemon_t* daemon = (language_daemon_t*)R_ExternalPtrAddr(daemon_r);
    // Use pselect directly (not wait_for_client_with_timeout) so we can
    // return immediately on EINTR from SIGTERM instead of retrying via WAIT
    fd_set read_fds;
    FD_ZERO(&read_fds);
    FD_SET(daemon->server_fd, &read_fds);
    int max_fd = daemon->server_fd;
    for (client_list_t* cl = daemon->client_fds; cl != NULL; cl = cl->next) {
        FD_SET(cl->fd, &read_fds);
        if (cl->fd > max_fd) max_fd = cl->fd;
    }
    // 100ms timeout -- short enough for responsive SIGTERM handling
    struct timespec ts = { .tv_sec = 0, .tv_nsec = 100000000 };
    sigset_t emptymask;
    sigemptyset(&emptymask);
    int ready = pselect(max_fd + 1, &read_fds, NULL, NULL, &ts, &emptymask);
    // Check shutdown after pselect (signal may have arrived during the call)
    if (r_shutting_down) {
        return ScalarInteger(-1);
    }
    // Timeout or interrupted -- return 0 (no client)
    if (ready <= 0) {
        return ScalarInteger(0);
    }
    // Accept new connection if server_fd is ready
    if (FD_ISSET(daemon->server_fd, &read_fds)) {
        int fd = accept(daemon->server_fd, NULL, NULL);
        if (fd >= 0) {
            fcntl(fd, F_SETFL, O_NONBLOCK);
            client_list_t* new_client = (client_list_t*)calloc(1, sizeof(client_list_t));
            if (new_client == NULL) {
                close(fd);
                MORLOC_ERROR("calloc failed");
            }
            new_client->fd = fd;
            new_client->next = NULL;
            if
(daemon->client_fds == NULL) {
                // Append the accepted connection to the client queue
                daemon->client_fds = new_client;
            } else {
                client_list_t* last = daemon->client_fds;
                while (last->next) last = last->next;
                last->next = new_client;
            }
        }
    }
    // Return first ready client fd
    if (daemon->client_fds != NULL) {
        client_list_t* first = daemon->client_fds;
        int client_fd = first->fd;
        daemon->client_fds = first->next;
        free(first);
        return ScalarInteger(client_fd);
    }
    return ScalarInteger(0);
}

// Parse a morloc call packet (raw vector) into list(manifold_id, list_of_raw_args)
SEXP morloc_read_morloc_call_packet(SEXP packet_r) { MAYFAIL
    uint8_t* packet = RAW(packet_r);
    morloc_call_t* call_packet = R_TRY(read_morloc_call_packet, packet);
    // Create two element R list
    // 1: manifold id
    // 2: argument list of raw packets
    SEXP r_list = PROTECT(allocVector(VECSXP, 2));
    // Convert midx to R integer
    SEXP r_mid = PROTECT(ScalarInteger(call_packet->midx));
    // Create arguments list
    SEXP r_args = PROTECT(allocVector(VECSXP, call_packet->nargs));
    for(size_t i = 0; i < call_packet->nargs; i++) {
        size_t arg_packet_size = R_TRY_WITH(UNPROTECT(3), morloc_packet_size, call_packet->args[i]);
        SEXP r_arg = PROTECT(allocVector(RAWSXP, arg_packet_size));
        memcpy(RAW(r_arg), call_packet->args[i], arg_packet_size);
        SET_VECTOR_ELT(r_args, i, r_arg);
        UNPROTECT(1); // r_arg
    }
    // Assemble final list
    SET_VECTOR_ELT(r_list, 0, r_mid);
    SET_VECTOR_ELT(r_list, 1, r_args);
    free_morloc_call(call_packet);
    UNPROTECT(3); // r_list, r_mid, r_args
    return r_list;
}

// Send a raw packet to a foreign server over an open client fd; returns the
// number of bytes sent as an R integer.
SEXP morloc_send_packet_to_foreign_server(SEXP client_fd_r, SEXP packet_r) { MAYFAIL
    if (TYPEOF(client_fd_r) != INTSXP || LENGTH(client_fd_r) != 1) {
        MORLOC_ERROR("client_fd must be a single integer");
    }
    if (TYPEOF(packet_r) != RAWSXP) {
        MORLOC_ERROR("packet must be a raw vector");
    }
    // Extract arguments
    int client_fd = INTEGER(client_fd_r)[0];
    uint8_t* packet = RAW(packet_r);
    size_t packet_size = (size_t)LENGTH(packet_r); // NOTE(review): currently unused
    // Call underlying implementation
    size_t bytes_sent = R_TRY(send_packet_to_foreign_server, client_fd, packet);
    // This could in theory be problematic, since int is smaller than size_t
    // In practice it should not be, since packets are typically small
    // However, if I refactor to send large packets in the future, this could be
    // problematic. Then I would need to convert to a double return.
    return ScalarInteger((int)bytes_sent);
}

// Read from socket returning raw vector of received data
SEXP morloc_stream_from_client(SEXP client_fd_r) { MAYFAIL
    if (TYPEOF(client_fd_r) != INTSXP || LENGTH(client_fd_r) != 1) {
        MORLOC_ERROR("client_fd must be a single integer");
    }
    int client_fd = INTEGER(client_fd_r)[0];
    // Read packet from socket
    uint8_t* packet = R_TRY(stream_from_client, client_fd);
    // Read the packet size from the header (free packet before longjmp on error)
    size_t packet_size = R_TRY_WITH(free(packet), morloc_packet_size, packet);
    // Create raw vector for result
    SEXP result = PROTECT(allocVector(RAWSXP, packet_size));
    memcpy(RAW(result), packet, packet_size);
    free(packet);
    UNPROTECT(1);
    return result;
}

// close_socket
SEXP morloc_close_socket(SEXP socket_id_r) {
    if (TYPEOF(socket_id_r) != INTSXP || LENGTH(socket_id_r) != 1) {
        MORLOC_ERROR("socket_id must be a single integer");
    }
    int socket_id = INTEGER(socket_id_r)[0];
    close_socket(socket_id);
    // Return invisible NULL
    return R_NilValue;
}

// put_value
// Serialize an R value per the schema string and return a morloc data packet
// (raw vector). Values with an "arrow" schema hint go through the Arrow C
// Data Interface instead of the voidstar path.
SEXP morloc_put_value(SEXP obj_r, SEXP schema_str_r) { MAYFAIL
    if (TYPEOF(schema_str_r) != STRSXP || LENGTH(schema_str_r) != 1) {
        MORLOC_ERROR("schema must be a single string");
    }
    const char* schema_cstr = CHAR(STRING_ELT(schema_str_r, 0));
    char* schema_str = strdup(schema_cstr);
    Schema* schema = R_TRY_WITH(free(schema_str), parse_schema, schema_str);
    free(schema_str);
    // Arrow dispatch: if schema hint is "arrow", use Arrow C Data Interface
    if (schema->hint && strcmp(schema->hint, "arrow") == 0) {
        // Export R arrow RecordBatch via C Data Interface -> copy to shm -> packet
        // arrow::ExportRecordBatch(batch, array_ptr, schema_ptr)
        struct ArrowSchema arrow_schema;
        struct ArrowArray arrow_array;
        memset(&arrow_schema, 0, sizeof(arrow_schema));
memset(&arrow_array, 0, sizeof(arrow_array));
        // Look up arrow::ExportRecordBatch dynamically so the arrow package
        // is only required when an arrow schema is actually used
        SEXP arrow_ns = PROTECT(R_FindNamespace(mkString("arrow")));
        SEXP export_fn = PROTECT(findVarInFrame(arrow_ns, install("ExportRecordBatch")));
        if (export_fn == R_UnboundValue) {
            UNPROTECT(2);
            free_schema(schema);
            MORLOC_ERROR("arrow::ExportRecordBatch not found; is the arrow package installed?");
        }
        SEXP array_ptr_r = PROTECT(R_MakeExternalPtr(&arrow_array, R_NilValue, R_NilValue));
        SEXP schema_ptr_r = PROTECT(R_MakeExternalPtr(&arrow_schema, R_NilValue, R_NilValue));
        SEXP call = PROTECT(lang4(export_fn, obj_r, array_ptr_r, schema_ptr_r));
        eval(call, arrow_ns);
        UNPROTECT(5);
        char* errmsg = NULL;
        relptr_t relptr = arrow_to_shm(&arrow_array, &arrow_schema, &errmsg);
        // Release the C Data Interface structures regardless of outcome
        if (arrow_schema.release) arrow_schema.release(&arrow_schema);
        if (arrow_array.release) arrow_array.release(&arrow_array);
        if (errmsg) {
            free_schema(schema);
            MORLOC_ERROR("Arrow export failed: %s", errmsg);
        }
        uint8_t* packet = make_arrow_data_packet(relptr, schema);
        if (!packet) {
            free_schema(schema);
            MORLOC_ERROR("Failed to create arrow data packet");
        }
        size_t packet_size = R_TRY_WITH({free(packet); free_schema(schema);}, morloc_packet_size, packet);
        SEXP result = PROTECT(allocVector(RAWSXP, packet_size));
        memcpy(RAW(result), packet, packet_size);
        free(packet);
        free_schema(schema);
        UNPROTECT(1);
        return result;
    }
    // Voidstar path: serialize into shared memory, then wrap in a packet
    void* voidstar = to_voidstar(obj_r, schema);
    if (!voidstar) {
        free_schema(schema);
        MORLOC_ERROR("Failed to convert R object to internal representation");
    }
    relptr_t relptr = R_TRY_WITH(free_schema(schema), abs2rel, voidstar);
    uint8_t* packet = R_TRY_WITH(free_schema(schema), make_data_packet_auto, voidstar, relptr, schema);
    const morloc_packet_header_t* hdr = (const morloc_packet_header_t*)packet;
    if (hdr->command.data.source != PACKET_SOURCE_RPTR) {
        // Data inlined in packet -- free SHM immediately
        char* free_err = NULL;
        shfree_by_schema((absptr_t)voidstar, schema, &free_err);
        if (free_err) { free(free_err); free_err = NULL; }
        shfree((absptr_t)voidstar, &free_err);
        if (free_err) { free(free_err); }
    }
    size_t packet_size = R_TRY_WITH({free(packet); free_schema(schema);}, morloc_packet_size, packet);
    SEXP result = PROTECT(allocVector(RAWSXP, packet_size));
    memcpy(RAW(result), packet, packet_size);
    free(packet);
    free_schema(schema);
    UNPROTECT(1);
    return result;
}

// mlc_show: serialize a value to a JSON string
SEXP morloc_mlc_show(SEXP obj_r, SEXP schema_str_r) { MAYFAIL
    if (TYPEOF(schema_str_r) != STRSXP || LENGTH(schema_str_r) != 1) {
        MORLOC_ERROR("schema must be a single string");
    }
    char* schema_str = strdup(CHAR(STRING_ELT(schema_str_r, 0)));
    Schema* schema = R_TRY_WITH(free(schema_str), parse_schema, schema_str);
    free(schema_str);
    void* voidstar = to_voidstar(obj_r, schema);
    if (!voidstar) {
        free_schema(schema);
        MORLOC_ERROR("Failed to convert R object to internal representation");
    }
    char* json = R_TRY_WITH(free_schema(schema), mlc_show, voidstar, schema);
    {
        // Best-effort free of the temporary shared-memory value
        char* shfree_errmsg = NULL;
        shfree(voidstar, &shfree_errmsg);
        free(shfree_errmsg);
    }
    free_schema(schema);
    SEXP result = PROTECT(mkString(json));
    free(json);
    UNPROTECT(1);
    return result;
}

// Deserialize a morloc data packet (raw vector) into an R value, dispatching
// on the packet header's source/format (Arrow, inline voidstar, or SHM).
SEXP morloc_get_value(SEXP packet_r, SEXP schema_str_r) { MAYFAIL
    if (TYPEOF(packet_r) != RAWSXP) {
        MORLOC_ERROR("packet must be a raw vector");
    }
    if (TYPEOF(schema_str_r) != STRSXP || LENGTH(schema_str_r) != 1) {
        MORLOC_ERROR("schema must be a single string");
    }
    // Extract arguments
    uint8_t* packet = RAW(packet_r);
    size_t packet_size = (size_t)LENGTH(packet_r); // NOTE(review): currently unused
    const morloc_packet_header_t* header = (const morloc_packet_header_t*)packet;
    uint8_t source = header->command.data.source;
    uint8_t format = header->command.data.format;
    const char* schema_cstr = CHAR(STRING_ELT(schema_str_r, 0));
    char* schema_str = strdup(schema_cstr);
    Schema* schema = R_TRY_WITH(free(schema_str), parse_schema, schema_str);
    free(schema_str);
    // Arrow dispatch: if packet format is Arrow, import via C Data Interface
    if (format == PACKET_FORMAT_ARROW) {
        uint8_t* arrow_ptr = R_TRY_WITH(free_schema(schema), get_morloc_data_packet_value, packet, schema);
        const arrow_shm_header_t* arrow_hdr = (const arrow_shm_header_t*)arrow_ptr;
        struct ArrowSchema arrow_schema;
        struct ArrowArray arrow_array;
        char* arrow_err = NULL;
        arrow_from_shm(arrow_hdr, &arrow_schema, &arrow_array, &arrow_err);
        if (arrow_err) {
            if (arrow_schema.release) arrow_schema.release(&arrow_schema);
            if (arrow_array.release) arrow_array.release(&arrow_array);
            free_schema(schema);
            MORLOC_ERROR("Arrow import failed: %s", arrow_err);
        }
        // Import via R arrow package: arrow::ImportRecordBatch(array_ptr, schema_ptr)
        SEXP arrow_ns = PROTECT(R_FindNamespace(mkString("arrow")));
        SEXP import_fn = PROTECT(findVarInFrame(arrow_ns, install("ImportRecordBatch")));
        if (import_fn == R_UnboundValue) {
            if (arrow_schema.release) arrow_schema.release(&arrow_schema);
            if (arrow_array.release) arrow_array.release(&arrow_array);
            UNPROTECT(2);
            free_schema(schema);
            MORLOC_ERROR("arrow::ImportRecordBatch not found; is the arrow package installed?");
        }
        SEXP array_ptr_r = PROTECT(R_MakeExternalPtr(&arrow_array, R_NilValue, R_NilValue));
        SEXP schema_ptr_r = PROTECT(R_MakeExternalPtr(&arrow_schema, R_NilValue, R_NilValue));
        SEXP call = PROTECT(lang3(import_fn, array_ptr_r, schema_ptr_r));
        SEXP obj_r = PROTECT(eval(call, arrow_ns));
        UNPROTECT(6);
        // Incref shm so data stays alive
        char* incref_err = NULL;
        shincref((absptr_t)arrow_ptr, &incref_err);
        if (incref_err) { free(incref_err); }
        free_schema(schema);
        return obj_r;
    }
    // Fast path: inline voidstar -- read directly from packet, no SHM needed
    if (source == PACKET_SOURCE_MESG && format == PACKET_FORMAT_VOIDSTAR) {
        const uint8_t* payload = packet + sizeof(morloc_packet_header_t) + header->offset;
        SEXP obj_r = from_voidstar((const void*)payload, schema, (const void*)payload);
        free_schema(schema);
        if (obj_r == NULL) {
            MORLOC_ERROR("Failed to convert internal representation to R object");
        }
        return obj_r;
    }
    // SHM paths
    uint8_t* voidstar = R_TRY_WITH(free_schema(schema), get_morloc_data_packet_value, packet, schema);
    SEXP obj_r = from_voidstar(voidstar, schema, NULL);
    if (obj_r == NULL) {
        free_schema(schema);
        MORLOC_ERROR("Failed to convert internal representation to R object");
    }
    free_schema(schema);
    return obj_r;
}

// Make a synchronous call to a foreign-language pool over a Unix socket:
// builds a call packet from raw-vector args, sends it, returns the raw reply.
SEXP morloc_foreign_call(SEXP socket_path_r, SEXP mid_r, SEXP args_r) { MAYFAIL
    // Validate inputs
    if (TYPEOF(socket_path_r) != STRSXP || LENGTH(socket_path_r) != 1) {
        MORLOC_ERROR("socket_path must be a single string");
    }
    if (TYPEOF(mid_r) != INTSXP || LENGTH(mid_r) != 1) {
        MORLOC_ERROR("mid must be a single integer");
    }
    if (TYPEOF(args_r) != VECSXP) {
        MORLOC_ERROR("args must be a list of raw vectors");
    }
    // Extract arguments
    const char* socket_path = CHAR(STRING_ELT(socket_path_r, 0));
    int mid = INTEGER(mid_r)[0];
    size_t nargs = (size_t)LENGTH(args_r);
    // Allocate temporary storage (R_alloc memory is reclaimed by R on return)
    const uint8_t** arg_packets = (const uint8_t**)R_alloc(nargs, sizeof(uint8_t*));
    // Convert R raw vectors to C buffers
    for (size_t i = 0; i < nargs; i++) {
        SEXP arg = VECTOR_ELT(args_r, i);
        if (TYPEOF(arg) != RAWSXP) {
            MORLOC_ERROR("All arguments must be raw vectors (argument %zu)", i+1);
        }
        arg_packets[i] = RAW(arg);
    }
    // Create call packet
    uint8_t* packet = R_TRY(
        make_morloc_local_call_packet,
        (uint32_t)mid,
        arg_packets,
        nargs
    );
    // Send/receive over socket
    uint8_t* result = R_TRY_WITH(free(packet),
        send_and_receive_over_socket,
        socket_path,
        packet
    );
    // Get result size
    size_t result_length = R_TRY_WITH({free(packet); free(result);}, morloc_packet_size, result);
    // Create result raw vector
    SEXP result_r = PROTECT(allocVector(RAWSXP, result_length));
    memcpy(RAW(result_r), result, result_length);
    free(packet);
    free(result);
    // Cleanup
    UNPROTECT(1);
    return result_r;
}

// Test whether a raw packet is a ping packet
SEXP morloc_is_ping(SEXP packet_r) { MAYFAIL
    if (TYPEOF(packet_r) != RAWSXP) {
        MORLOC_ERROR("packet must be a raw vector");
    }
    bool is_ping = R_TRY(packet_is_ping, RAW(packet_r));
    return ScalarLogical(is_ping);
}

SEXP morloc_is_local_call(SEXP
packet_r) { MAYFAIL if (TYPEOF(packet_r) != RAWSXP) { MORLOC_ERROR("packet must be a raw vector"); } bool is_local_call = R_TRY(packet_is_local_call, RAW(packet_r)); return ScalarLogical(is_local_call); } SEXP morloc_is_remote_call(SEXP packet_r) { MAYFAIL if (TYPEOF(packet_r) != RAWSXP) { MORLOC_ERROR("packet must be a raw vector"); } bool is_remote_call = R_TRY(packet_is_remote_call, RAW(packet_r)); return ScalarLogical(is_remote_call); } SEXP morloc_pong(SEXP packet_r) { MAYFAIL if (TYPEOF(packet_r) != RAWSXP) { MORLOC_ERROR("packet must be a raw vector"); } // Generate a response to ping uint8_t* pong = R_TRY(return_ping, RAW(packet_r)); size_t pong_size = R_TRY_WITH(free(pong), morloc_packet_size, pong); SEXP result_r = PROTECT(allocVector(RAWSXP, pong_size)); memcpy(RAW(result_r), pong, pong_size); free(pong); UNPROTECT(1); return result_r; } SEXP morloc_make_fail_packet(SEXP failure_message_r) { MAYFAIL const char* failure_message = CHAR(STRING_ELT(failure_message_r, 0)); uint8_t* fail_packet = make_fail_packet(failure_message); size_t packet_size = R_TRY(morloc_packet_size, fail_packet); SEXP packet_r = PROTECT(allocVector(RAWSXP, packet_size)); memcpy(RAW(packet_r), fail_packet, packet_size); free(fail_packet); UNPROTECT(1); return packet_r; } SEXP extract_element_by_name(SEXP list, const char* key) { // Ensure inputs are correct types if (TYPEOF(list) != VECSXP) MORLOC_ERROR("Input must be a list"); // Get list names attribute SEXP names = Rf_getAttrib(list, R_NamesSymbol); if (names == R_NilValue) MORLOC_ERROR("List must have names"); // Iterate through list elements for (int i = 0; i < Rf_length(list); i++) { const char *current_name = CHAR(STRING_ELT(names, i)); if (strcmp(key, current_name) == 0) { return VECTOR_ELT(list, i); // Return matching element } } return R_NilValue; // Return NULL if name not found } SEXP morloc_remote_call(SEXP midx, SEXP socket_path, SEXP cache_path, SEXP resources, SEXP arg_packets) { MAYFAIL // Protect all R inputs 
immediately PROTECT(socket_path); PROTECT(cache_path); PROTECT(resources); PROTECT(arg_packets = coerceVector(arg_packets, VECSXP)); // Convert basic parameters int c_midx = INTEGER(midx)[0]; const char* c_socket_path = CHAR(STRING_ELT(socket_path, 0)); const char* c_cache_path = CHAR(STRING_ELT(cache_path, 0)); // Extract resources with validation resources_t c_resources; SEXP mem = extract_element_by_name(resources, "memory"); SEXP tim = extract_element_by_name(resources, "time"); SEXP cpu = extract_element_by_name(resources, "cpus"); SEXP gpu = extract_element_by_name(resources, "gpus"); if (mem == R_NilValue || tim == R_NilValue || cpu == R_NilValue || gpu == R_NilValue) { UNPROTECT(4); MORLOC_ERROR("Missing required resource field (memory, time, cpus, or gpus)"); } c_resources.memory = INTEGER(mem)[0]; c_resources.time = INTEGER(tim)[0]; c_resources.cpus = INTEGER(cpu)[0]; c_resources.gpus = INTEGER(gpu)[0]; // Process argument packets with type checking size_t nargs = LENGTH(arg_packets); const uint8_t** c_arg_packets = (const uint8_t**) R_alloc(nargs, sizeof(uint8_t*)); for(size_t i = 0; i < nargs; i++) { SEXP raw_vec = VECTOR_ELT(arg_packets, i); if(TYPEOF(raw_vec) != RAWSXP) { UNPROTECT(4); MORLOC_ERROR("arg_packets must contain only raw vectors"); } c_arg_packets[i] = (uint8_t*)RAW(raw_vec); } // Execute remote call uint8_t* result_packet = R_TRY_WITH(UNPROTECT(4), remote_call, c_midx, c_socket_path, c_cache_path, &c_resources, c_arg_packets, nargs ); // Validate and copy result size_t packet_size = R_TRY_WITH({free(result_packet); UNPROTECT(4);}, morloc_packet_size, result_packet); if(!result_packet || packet_size == 0) { if(result_packet) free(result_packet); UNPROTECT(4); MORLOC_ERROR("Invalid result packet from remote call"); } SEXP result_packet_r = PROTECT(allocVector(RAWSXP, packet_size)); memcpy(RAW(result_packet_r), result_packet, packet_size); free(result_packet); // Cleanup and return UNPROTECT(5); // socket_path, cache_path, resources, 
arg_packets, result_packet_r return result_packet_r; } // {{{ fork and fd-passing functions SEXP morloc_socketpair(void) { int sv[2]; if (socketpair(AF_UNIX, SOCK_STREAM, 0, sv) < 0) { error("socketpair failed: %s", strerror(errno)); } SEXP result = PROTECT(allocVector(INTSXP, 2)); INTEGER(result)[0] = sv[0]; INTEGER(result)[1] = sv[1]; UNPROTECT(1); return result; } SEXP morloc_fork(void) { pid_t pid = fork(); if (pid < 0) { error("fork failed: %s", strerror(errno)); } return ScalarInteger((int)pid); } // Immediately terminate the process without running any cleanup. // Must be used by forked worker children instead of R's quit(). // R's quit() runs finalizers that try to free objects allocated by the // parent process, which corrupts the heap on glibc >= 2.39. SEXP morloc_exit(SEXP status_r) { int status = INTEGER(status_r)[0]; _exit(status); return R_NilValue; // unreachable } SEXP morloc_send_fd(SEXP pipe_fd_r, SEXP client_fd_r) { int pipe_fd = INTEGER(pipe_fd_r)[0]; int client_fd = INTEGER(client_fd_r)[0]; struct msghdr msg = {0}; struct iovec iov; char buf[1] = {0}; char cmsgbuf[CMSG_SPACE(sizeof(int))]; iov.iov_base = buf; iov.iov_len = 1; msg.msg_iov = &iov; msg.msg_iovlen = 1; msg.msg_control = cmsgbuf; msg.msg_controllen = sizeof(cmsgbuf); struct cmsghdr *cmsg = CMSG_FIRSTHDR(&msg); cmsg->cmsg_level = SOL_SOCKET; cmsg->cmsg_type = SCM_RIGHTS; cmsg->cmsg_len = CMSG_LEN(sizeof(int)); memcpy(CMSG_DATA(cmsg), &client_fd, sizeof(int)); ssize_t n = sendmsg(pipe_fd, &msg, 0); if (n < 0) { error("sendmsg SCM_RIGHTS failed: %s", strerror(errno)); } return R_NilValue; } SEXP morloc_recv_fd(SEXP pipe_fd_r) { int pipe_fd = INTEGER(pipe_fd_r)[0]; struct msghdr msg = {0}; struct iovec iov; char buf[1]; char cmsgbuf[CMSG_SPACE(sizeof(int))]; iov.iov_base = buf; iov.iov_len = 1; msg.msg_iov = &iov; msg.msg_iovlen = 1; msg.msg_control = cmsgbuf; msg.msg_controllen = sizeof(cmsgbuf); ssize_t n = recvmsg(pipe_fd, &msg, 0); if (n <= 0) { return ScalarInteger(-1); } struct 
cmsghdr *cmsg = CMSG_FIRSTHDR(&msg); if (cmsg == NULL || cmsg->cmsg_level != SOL_SOCKET || cmsg->cmsg_type != SCM_RIGHTS) { return ScalarInteger(-1); } int fd; memcpy(&fd, CMSG_DATA(cmsg), sizeof(int)); return ScalarInteger(fd); } SEXP morloc_kill(SEXP pid_r, SEXP sig_r) { pid_t pid = (pid_t)INTEGER(pid_r)[0]; int sig = INTEGER(sig_r)[0]; int ret = kill(pid, sig); return ScalarInteger(ret); } SEXP morloc_waitpid(SEXP pid_r) { pid_t pid = (pid_t)INTEGER(pid_r)[0]; int status; pid_t result = waitpid(pid, &status, WNOHANG); return ScalarInteger((int)result); } SEXP morloc_waitpid_blocking(SEXP pid_r) { pid_t pid = (pid_t)INTEGER(pid_r)[0]; int status; pid_t result = waitpid(pid, &status, 0); return ScalarInteger((int)result); } // }}} fork and fd-passing functions // {{{ shared counter functions (for dynamic worker spawning) static void shared_counter_finalizer(SEXP ptr) { int* p = (int*)R_ExternalPtrAddr(ptr); if (p != NULL) { munmap(p, sizeof(int)); R_ClearExternalPtr(ptr); } } SEXP morloc_shared_counter_create(void) { int* p = (int*)mmap(NULL, sizeof(int), PROT_READ | PROT_WRITE, MAP_SHARED | MAP_ANONYMOUS, -1, 0); if (p == MAP_FAILED) { error("mmap failed for shared counter: %s", strerror(errno)); } *p = 0; SEXP ptr = PROTECT(R_MakeExternalPtr(p, R_NilValue, R_NilValue)); R_RegisterCFinalizerEx(ptr, shared_counter_finalizer, TRUE); UNPROTECT(1); return ptr; } SEXP morloc_shared_counter_inc(SEXP ptr_r) { int* p = (int*)R_ExternalPtrAddr(ptr_r); if (p == NULL) error("shared counter is NULL"); int val = __atomic_add_fetch(p, 1, __ATOMIC_RELAXED); return ScalarInteger(val); } SEXP morloc_shared_counter_dec(SEXP ptr_r) { int* p = (int*)R_ExternalPtrAddr(ptr_r); if (p == NULL) error("shared counter is NULL"); int val = __atomic_sub_fetch(p, 1, __ATOMIC_RELAXED); return ScalarInteger(val); } SEXP morloc_shared_counter_read(SEXP ptr_r) { int* p = (int*)R_ExternalPtrAddr(ptr_r); if (p == NULL) error("shared counter is NULL"); int val = __atomic_load_n(p, __ATOMIC_RELAXED); 
return ScalarInteger(val); } SEXP morloc_pipe(void) { int fds[2]; if (pipe(fds) != 0) { error("pipe failed: %s", strerror(errno)); } SEXP result = PROTECT(allocVector(INTSXP, 2)); INTEGER(result)[0] = fds[0]; /* read end */ INTEGER(result)[1] = fds[1]; /* write end */ UNPROTECT(1); return result; } SEXP morloc_write_byte(SEXP fd_r, SEXP byte_r) { int fd = INTEGER(fd_r)[0]; unsigned char b = (unsigned char)RAW(byte_r)[0]; ssize_t n = write(fd, &b, 1); return ScalarInteger((int)n); } SEXP morloc_close_fd(SEXP fd_r) { int fd = INTEGER(fd_r)[0]; close(fd); return R_NilValue; } // }}} shared counter functions // {{{ C-level worker loop // Receive a file descriptor over a Unix domain socket (C-level helper). static int recv_fd_c(int pipe_fd) { struct msghdr msg = {0}; struct iovec iov; char buf[1]; char cmsgbuf[CMSG_SPACE(sizeof(int))]; iov.iov_base = buf; iov.iov_len = 1; msg.msg_iov = &iov; msg.msg_iovlen = 1; msg.msg_control = cmsgbuf; msg.msg_controllen = sizeof(cmsgbuf); ssize_t n = recvmsg(pipe_fd, &msg, 0); if (n <= 0) return -1; struct cmsghdr *cmsg = CMSG_FIRSTHDR(&msg); if (!cmsg || cmsg->cmsg_level != SOL_SOCKET || cmsg->cmsg_type != SCM_RIGHTS) return -1; int fd; memcpy(&fd, CMSG_DATA(cmsg), sizeof(int)); return fd; } // Send a fail packet to the client (best-effort, ignores send errors). static void send_fail_to_client(int client_fd, const char* msg) { char* errmsg = NULL; uint8_t* fail = make_fail_packet(msg); send_packet_to_foreign_server(client_fd, fail, &errmsg); free(fail); } // Dispatch a call to a manifold function. All packet handling is in C; // only the manifold evaluation crosses into R via R_tryEval. static void dispatch_manifold_c(int client_fd, const uint8_t* packet, SEXP dispatch, const char* label) { char* errmsg = NULL; morloc_call_t* call = read_morloc_call_packet(packet, &errmsg); if (errmsg) { send_fail_to_client(client_fd, errmsg); return; } int midx = (int)call->midx; SEXP fn = (midx >= 1 && midx <= LENGTH(dispatch)) ? 
VECTOR_ELT(dispatch, midx - 1) : R_NilValue; if (fn == R_NilValue) { char msg[128]; snprintf(msg, sizeof(msg), "%s function not found: m%d", label, midx); send_fail_to_client(client_fd, msg); free_morloc_call(call); return; } // Build R pairlist of raw-vector arguments: fn(arg1, arg2, ...) int nprotect = 0; SEXP pairlist = R_NilValue; for (int i = (int)call->nargs - 1; i >= 0; i--) { size_t arg_size = morloc_packet_size(call->args[i], &errmsg); if (errmsg) { UNPROTECT(nprotect); send_fail_to_client(client_fd, errmsg); free_morloc_call(call); return; } SEXP r_arg = PROTECT(allocVector(RAWSXP, arg_size)); nprotect++; memcpy(RAW(r_arg), call->args[i], arg_size); pairlist = PROTECT(Rf_cons(r_arg, pairlist)); nprotect++; } free_morloc_call(call); SEXP r_call = PROTECT(Rf_lcons(fn, pairlist)); nprotect++; // Single crossing into R: evaluate the manifold int eval_err = 0; SEXP result = R_tryEvalSilent(r_call, R_GlobalEnv, &eval_err); if (eval_err || result == R_NilValue || TYPEOF(result) != RAWSXP) { UNPROTECT(nprotect); send_fail_to_client(client_fd, eval_err ? R_curErrorBuf() : "manifold returned non-raw result"); return; } PROTECT(result); nprotect++; send_packet_to_foreign_server(client_fd, RAW(result), &errmsg); UNPROTECT(nprotect); } // Process one client job entirely in C. Only crosses into R for // the actual manifold evaluation. 
// Process one client job entirely in C. Only crosses into R for
// the actual manifold evaluation.
//
// Reads one packet from the client socket, dispatches it by type
// (local call, remote call, or ping), and always closes the client
// socket before returning. Any error message produced by the packet
// predicates or the ping round-trip is reported back to the client as
// a fail packet and then freed (the original leaked it).
static void run_job_c(int client_fd, SEXP dispatch, SEXP remote_dispatch) {
    char* errmsg = NULL;

    // Read the full request packet; on read failure report and bail out.
    uint8_t* packet = stream_from_client(client_fd, &errmsg);
    if (errmsg) {
        send_fail_to_client(client_fd, errmsg);
        free(errmsg);
        close_socket(client_fd);
        return;
    }

    // Dispatch by packet type. Each predicate may set errmsg; once set,
    // all remaining branches are skipped and the error handler below runs.
    bool is_local = packet_is_local_call(packet, &errmsg);
    if (!errmsg && is_local) {
        dispatch_manifold_c(client_fd, packet, dispatch, "Local");
    } else if (!errmsg) {
        bool is_remote = packet_is_remote_call(packet, &errmsg);
        if (!errmsg && is_remote) {
            dispatch_manifold_c(client_fd, packet, remote_dispatch, "Remote");
        } else if (!errmsg) {
            bool is_ping_pkt = packet_is_ping(packet, &errmsg);
            if (!errmsg && is_ping_pkt) {
                // Ping: echo a pong packet back to the client.
                uint8_t* pong = return_ping(packet, &errmsg);
                if (!errmsg) {
                    send_packet_to_foreign_server(client_fd, pong, &errmsg);
                    free(pong);
                }
            } else if (!errmsg) {
                send_fail_to_client(client_fd, "Unexpected packet type");
            }
        }
    }

    // Report any accumulated error to the client. BUG FIX: the message is
    // heap-allocated by the callee (see the free() on the read path above),
    // so it must be freed here as well; the original code leaked it.
    if (errmsg) {
        send_fail_to_client(client_fd, errmsg);
        free(errmsg);
    }

    free(packet);
    close_socket(client_fd);
}
// Tight C worker loop. Receives fds from the job queue and processes them,
// crossing into R only for manifold evaluation.
SEXP morloc_worker_loop_c(SEXP pipe_fd_r, SEXP dispatch_r, SEXP remote_dispatch_r) { int pipe_fd = INTEGER(pipe_fd_r)[0]; PROTECT(dispatch_r); PROTECT(remote_dispatch_r); while (!r_shutting_down) { int client_fd = recv_fd_c(pipe_fd); if (client_fd < 0) break; run_job_c(client_fd, dispatch_r, remote_dispatch_r); fflush(stdout); } UNPROTECT(2); return R_NilValue; } // }}} C-level worker loop // }}} exported functions void R_init_rmorloc(DllInfo *info) { R_CallMethodDef callMethods[] = { {"morloc_start_daemon", (DL_FUNC) &morloc_start_daemon, 4}, {"morloc_wait_for_client", (DL_FUNC) &morloc_wait_for_client, 1}, {"morloc_read_morloc_call_packet", (DL_FUNC) &morloc_read_morloc_call_packet, 1}, {"morloc_send_packet_to_foreign_server", (DL_FUNC) &morloc_send_packet_to_foreign_server, 2}, {"morloc_stream_from_client", (DL_FUNC) &morloc_stream_from_client, 1}, {"morloc_close_socket", (DL_FUNC) &morloc_close_socket, 1}, {"morloc_foreign_call", (DL_FUNC) &morloc_foreign_call, 3}, {"morloc_get_value", (DL_FUNC) &morloc_get_value, 2}, {"morloc_put_value", (DL_FUNC) &morloc_put_value, 2}, {"morloc_mlc_show", (DL_FUNC) &morloc_mlc_show, 2}, {"morloc_is_ping", (DL_FUNC) &morloc_is_ping, 1}, {"morloc_is_local_call", (DL_FUNC) &morloc_is_local_call, 1}, {"morloc_is_remote_call", (DL_FUNC) &morloc_is_remote_call, 1}, {"morloc_remote_call", (DL_FUNC) &morloc_remote_call, 5}, {"morloc_pong", (DL_FUNC) &morloc_pong, 1}, {"morloc_make_fail_packet", (DL_FUNC) &morloc_make_fail_packet, 1}, {"morloc_shinit", (DL_FUNC) &morloc_shinit, 3}, {"morloc_socketpair", (DL_FUNC) &morloc_socketpair, 0}, {"morloc_fork", (DL_FUNC) &morloc_fork, 0}, {"morloc_exit", (DL_FUNC) &morloc_exit, 1}, {"morloc_send_fd", (DL_FUNC) &morloc_send_fd, 2}, {"morloc_recv_fd", (DL_FUNC) &morloc_recv_fd, 1}, {"morloc_kill", (DL_FUNC) &morloc_kill, 2}, {"morloc_waitpid", (DL_FUNC) &morloc_waitpid, 1}, {"morloc_waitpid_blocking", (DL_FUNC) &morloc_waitpid_blocking, 1}, {"morloc_install_sigterm_handler", (DL_FUNC) 
&morloc_install_sigterm_handler, 0}, {"morloc_set_line_buffered", (DL_FUNC) &morloc_set_line_buffered, 0}, {"morloc_is_shutting_down", (DL_FUNC) &morloc_is_shutting_down, 0}, {"morloc_detach_daemon", (DL_FUNC) &morloc_detach_daemon, 1}, {"morloc_shared_counter_create", (DL_FUNC) &morloc_shared_counter_create, 0}, {"morloc_shared_counter_inc", (DL_FUNC) &morloc_shared_counter_inc, 1}, {"morloc_shared_counter_dec", (DL_FUNC) &morloc_shared_counter_dec, 1}, {"morloc_shared_counter_read", (DL_FUNC) &morloc_shared_counter_read, 1}, {"morloc_pipe", (DL_FUNC) &morloc_pipe, 0}, {"morloc_write_byte", (DL_FUNC) &morloc_write_byte, 2}, {"morloc_close_fd", (DL_FUNC) &morloc_close_fd, 1}, {"morloc_worker_loop_c", (DL_FUNC) &morloc_worker_loop_c, 3}, {NULL, NULL, 0} }; R_registerRoutines(info, NULL, callMethods, NULL, NULL); R_useDynamicSymbols(info, FALSE); } ================================================ FILE: data/misc/mlccpptypes.hpp ================================================ ================================================ FILE: data/morloc/morloc.h ================================================ // morloc.h -- C ABI contract for libmorloc.so // // This is the single public header for consumers of the morloc runtime library. // It defines all types and function declarations exported by libmorloc.so. #ifndef __MORLOC_H__ #define __MORLOC_H__ #ifdef __cplusplus extern "C" { #endif // ======================================================================== // Section 1: System includes and basic typedefs // ======================================================================== #include // va_list, va_start, va_arg, va_end (used by pool templates) #include #include #include #include // FILE* for read_binary_fd #include // fd_set #include #include // pid_t, ssize_t #include // struct sockaddr_un // Error message output parameter: all fallible functions take this as their // last argument. 
On failure the callee sets *errmsg_ to a heap-allocated // string describing the error. On success *errmsg_ is set to NULL. typedef char** errmsg_; #define ERRMSG char** errmsg_ // Exit codes used by several functions. #define EXIT_PASS 0 #define EXIT_FAIL 1 // Convenience macros used by language extensions (pymorloc.c, rmorloc.c, cppmorloc.cpp) #include // free #define FREE(ptr) if(ptr != NULL){ free(ptr); ptr = NULL; } // Size limits shared between library and consumers. #define MAX_FILENAME_SIZE 128 #define MAX_ERRMSG_SIZE 1024 #define MAX_PATH_SIZE 512 #define BUFFER_SIZE 4096 // Opaque JSON builder handle (Rust uses its own struct internally). typedef void* json_buf_t; // ======================================================================== // Section 2: Memory / SHM types // ======================================================================== // Pointer types for the multi-volume shared memory pool. // // relptr_t -- index into the logical (multi-volume) pool; shared between // processes. // volptr_t -- index into a single volume (0 = first block after shm header). // absptr_t -- absolute virtual address in the current process. typedef ssize_t relptr_t; typedef ssize_t volptr_t; typedef void* absptr_t; #define VOLNULL -1 #define RELNULL -1 // Magic numbers for integrity checks. #define SHM_MAGIC 0xFECA0DF0 #define BLK_MAGIC 0x0CB10DF0 #define MAX_VOLUME_NUMBER 32 // Shared memory volume header (lives at the start of each mmap'd region). typedef struct shm_s { unsigned int magic; char volume_name[MAX_FILENAME_SIZE]; int volume_index; size_t volume_size; size_t relative_offset; // Note: pthread_rwlock_t is opaque; consumers should not access it directly. // It is included here so that sizeof(shm_t) is correct for mmap calculations. // On Linux x86_64 this is typically 56 bytes. char _rwlock_storage[56]; // placeholder for pthread_rwlock_t volptr_t cursor; } shm_t; // Block header preceding every allocation inside a shared memory volume. 
// Atomic reference count for thread safety. Layout is stable (no padding). typedef struct block_header_s { unsigned int magic; unsigned int reference_count; // actually _Atomic in the C impl size_t size; } block_header_t; // ======================================================================== // Section 3: Schema types // ======================================================================== typedef enum { MORLOC_NIL, MORLOC_BOOL, MORLOC_SINT8, MORLOC_SINT16, MORLOC_SINT32, MORLOC_SINT64, MORLOC_UINT8, MORLOC_UINT16, MORLOC_UINT32, MORLOC_UINT64, MORLOC_FLOAT32, MORLOC_FLOAT64, MORLOC_TENSOR, MORLOC_STRING, MORLOC_ARRAY, MORLOC_TUPLE, MORLOC_MAP, MORLOC_OPTIONAL } morloc_serial_type; // Single-character schema encoding tokens. #define SCHEMA_NIL 'z' #define SCHEMA_BOOL 'b' #define SCHEMA_SINT 'i' #define SCHEMA_UINT 'u' #define SCHEMA_FLOAT 'f' #define SCHEMA_STRING 's' #define SCHEMA_ARRAY 'a' #define SCHEMA_TENSOR 'T' #define SCHEMA_TUPLE 't' #define SCHEMA_MAP 'm' #define SCHEMA_OPTIONAL '?' // Schema: recursive type descriptor used for serialisation/deserialisation. struct Schema; typedef struct Schema { morloc_serial_type type; size_t size; // number of parameters size_t width; // bytes per element when stored in a fixed-width array size_t* offsets; // field offsets (tuples) or ndim (tensors, in offsets[0]) char* hint; struct Schema** parameters; char** keys; // field names (records only) } Schema; // Variable-length array in voidstar representation. typedef struct Array { size_t size; relptr_t data; } Array; // Dense N-dimensional tensor in voidstar representation (row-major / C order). 
typedef struct Tensor { size_t total_elements; uint32_t device_type; // reserved: 0 = CPU uint32_t device_id; // reserved: 0 relptr_t data; // relptr to contiguous element data relptr_t shape; // relptr to int64_t[ndim] } Tensor; // ======================================================================== // Section 4: Packet types // ======================================================================== #define MORLOC_PACKET_MAGIC 0x0707f86d // Packet type discriminator. typedef uint8_t command_type_t; #define PACKET_TYPE_DATA ((command_type_t)0) #define PACKET_TYPE_CALL ((command_type_t)1) #define PACKET_TYPE_PING ((command_type_t)2) // Packed command sub-structs (all 8 bytes wide). typedef struct __attribute__((packed)) packet_command_type_s { command_type_t type; uint8_t padding[7]; } packet_command_type_t; #define PACKET_ENTRYPOINT_LOCAL 0x00 #define PACKET_ENTRYPOINT_REMOTE_SFS 0x01 typedef struct __attribute__((packed)) packet_command_call_s { command_type_t type; uint8_t entrypoint; uint8_t padding[2]; uint32_t midx; } packet_command_call_t; // Data source, format, compression, encryption, and status constants. 
#define PACKET_SOURCE_MESG 0x00 #define PACKET_SOURCE_FILE 0x01 #define PACKET_SOURCE_RPTR 0x02 #define PACKET_FORMAT_JSON 0x00 #define PACKET_FORMAT_MSGPACK 0x01 #define PACKET_FORMAT_TEXT 0x02 #define PACKET_FORMAT_DATA 0x03 #define PACKET_FORMAT_VOIDSTAR 0x04 #define PACKET_FORMAT_ARROW 0x05 #define PACKET_COMPRESSION_NONE 0x00 #define PACKET_ENCRYPTION_NONE 0x00 #define PACKET_STATUS_PASS 0x00 #define PACKET_STATUS_FAIL 0x01 typedef struct __attribute__((packed)) packet_command_data_s { command_type_t type; uint8_t source; uint8_t format; uint8_t compression; uint8_t encryption; uint8_t status; uint8_t padding[2]; } packet_command_data_t; typedef struct __attribute__((packed)) packet_command_ping_s { command_type_t type; uint8_t padding[7]; } packet_command_ping_t; typedef union __attribute__((packed)) packet_command_u { packet_command_type_t cmd_type; packet_command_call_t call; packet_command_data_t data; packet_command_ping_t ping; } packet_command_t; // 32-byte packet header (stable binary format, packed). typedef struct __attribute__((packed)) morloc_packet_header_s { uint32_t magic; uint16_t plain; uint16_t version; uint16_t flavor; uint16_t mode; packet_command_t command; uint32_t offset; uint64_t length; } morloc_packet_header_t; // Inline threshold: voidstar data <= this size is embedded in packet payload. #define MORLOC_INLINE_THRESHOLD (64 * 1024) // Metadata sub-header in packet metadata sections. 
#define MORLOC_METADATA_TYPE_SCHEMA_STRING 0x01 #define MORLOC_METADATA_TYPE_XXHASH 0x02 #define MORLOC_METADATA_HEADER_MAGIC "mmh" typedef struct __attribute__((packed)) morloc_metadata_header_s { char magic[3]; uint8_t type; uint32_t size; } morloc_metadata_header_t; // ======================================================================== // Section 5: Expression / eval types // ======================================================================== typedef struct argument_s { char* value; char** fields; char** default_fields; size_t size; } argument_t; typedef enum { MORLOC_X_DAT, MORLOC_X_APP, MORLOC_X_LAM, MORLOC_X_BND, MORLOC_X_PAT, MORLOC_X_FMT, MORLOC_X_SHOW, MORLOC_X_READ } morloc_expression_type; typedef enum { APPLY_PATTERN, APPLY_LAMBDA, APPLY_FORMAT } morloc_app_expression_type; typedef enum { SELECT_BY_KEY, SELECT_BY_INDEX, SELECT_END } morloc_pattern_type; // Forward declarations. typedef struct morloc_expression_s morloc_expression_t; typedef struct morloc_app_expression_s morloc_app_expression_t; typedef struct morloc_lam_expression_s morloc_lam_expression_t; typedef struct morloc_data_s morloc_data_t; typedef struct morloc_pattern_s morloc_pattern_t; typedef union primitive_u { char* s; uint8_t z; bool b; int8_t i1; int16_t i2; int32_t i4; int64_t i8; uint8_t u1; uint16_t u2; uint32_t u4; uint64_t u8; float f4; double f8; } primitive_t; typedef struct morloc_data_array_s { Schema* schema; size_t size; morloc_expression_t** values; } morloc_data_array_t; typedef struct morloc_data_s { bool is_voidstar; union { primitive_t lit_val; morloc_expression_t** tuple_val; morloc_data_array_t* array_val; void* voidstar; } data; } morloc_data_t; typedef struct morloc_app_expression_s { morloc_app_expression_type type; union { morloc_pattern_t* pattern; morloc_lam_expression_t* lambda; char** fmt; } function; morloc_expression_t** args; size_t nargs; } morloc_app_expression_t; typedef struct morloc_lam_expression_s { size_t nargs; char** args; 
morloc_expression_t* body;
} morloc_lam_expression_t;

// A pattern selects components of a value, either by positional index or by
// record key; `selectors` holds one sub-pattern per selected field.
// NOTE(review): `morloc_pattern_t` is used inside its own definition, so a
// forward typedef presumably exists earlier in this header -- confirm.
typedef struct morloc_pattern_s {
    morloc_pattern_type type;
    size_t size;              // number of selected fields
    union {
        size_t* indices;      // positional selectors
        char** keys;          // record-key selectors
    } fields;
    morloc_pattern_t** selectors;
} morloc_pattern_t;

// Tagged expression node; `type` says which union member is active.
typedef struct morloc_expression_s {
    morloc_expression_type type;
    Schema* schema;
    union {
        morloc_app_expression_t* app_expr;
        morloc_lam_expression_t* lam_expr;
        char* bnd_expr;
        char** interpolation;
        morloc_pattern_t* pattern_expr;
        morloc_data_t* data_expr;
        morloc_expression_t* unary_expr;
    } expr;
} morloc_expression_t;

// ========================================================================
// Section 6: Manifest types
// ========================================================================

// One language pool: interpreter/launch command plus its socket name.
typedef struct {
    char* lang;
    char** exec;   // NULL-terminated array
    char* socket;  // socket basename
} manifest_pool_t;

// CLI argument kinds: positional, option, flag, or group of sub-arguments.
typedef enum { MARG_POS = 0, MARG_OPT, MARG_FLAG, MARG_GRP } manifest_arg_kind_t;

typedef struct manifest_arg_s manifest_arg_t;

// Named member of an argument group.
typedef struct {
    char* key;
    manifest_arg_t* arg;
} manifest_grp_entry_t;

// Description of a single command-line argument.
struct manifest_arg_s {
    manifest_arg_kind_t kind;
    char** desc;
    char* metavar;
    char* type_desc;
    bool quoted;
    char short_opt;
    char* long_opt;
    char* long_rev;
    char* default_val;
    char grp_short;
    char* grp_long;
    manifest_grp_entry_t* entries;  // only used when kind == MARG_GRP
    size_t n_entries;
};

// Named group of commands (for help output).
typedef struct {
    char* name;
    char** desc;
} manifest_cmd_group_t;

// One exported command: its id, pool placement, schemas and CLI arguments.
typedef struct {
    char* name;
    bool is_pure;
    uint32_t mid;
    size_t pool_index;
    size_t* needed_pools;
    size_t n_needed_pools;
    char** arg_schemas;
    char* return_schema;
    char** desc;
    char* return_type;
    char** return_desc;
    manifest_arg_t* args;
    size_t n_args;
    morloc_expression_t* expr;
    char* group;
} manifest_command_t;

// Optional service endpoint description.
typedef struct {
    char* type;
    char* host;
    int port;
    char* socket;
} manifest_service_t;

// Top-level manifest for a compiled morloc program.
typedef struct {
    int version;
    char* name;
    char* build_dir;
    manifest_pool_t* pools;
    size_t n_pools;
    manifest_command_t* commands;
    size_t n_commands;
    manifest_cmd_group_t* groups;
    size_t n_groups;
    manifest_service_t* service;
} manifest_t;

// ========================================================================
// Section 7: Daemon / HTTP / Router types
// ========================================================================

// -- Call types --

// A decoded call packet: target morloc id plus its argument packets.
typedef struct morloc_call_s {
    uint32_t midx;
    uint8_t** args;
    size_t nargs;
    int owns_args;  // nonzero if free_morloc_call should release args
} morloc_call_t;

// Singly-linked list of connected client file descriptors.
typedef struct client_list_s {
    int fd;
    struct client_list_s* next;
} client_list_t;

// State for a per-language daemon listening on a UNIX socket.
typedef struct language_daemon_s {
    char* socket_path;
    char* tmpdir;
    char* shm_basename;
    shm_t* shm;
    size_t shm_default_size;
    int server_fd;
    fd_set read_fds;
    client_list_t* client_fds;
} language_daemon_t;

// Handle on a launched language pool process.
typedef struct morloc_socket_s {
    char* lang;
    char** syscmd;
    char* socket_filename;
    int pid;
} morloc_socket_t;

// -- Binding store --

// One stored binding: hashed expression plus its artifacts and names.
typedef struct binding_entry_s {
    uint64_t hash;
    char* expr;
    char* artifact_dir;
    char* type_sig;
    char** names;
    size_t n_names;
} binding_entry_t;

// Open-addressed table of bindings persisted under base_dir.
typedef struct binding_store_s {
    binding_entry_t* entries;
    size_t capacity;
    size_t count;
    char* base_dir;
    char* names_path;
} binding_store_t;

// -- Daemon config and request/response --

typedef void (*pool_check_fn_t)(morloc_socket_t* sockets, size_t n_pools);
typedef bool (*pool_alive_fn_t)(size_t pool_index);

// Runtime configuration handed to daemon_run / router_run.
typedef struct daemon_config_s {
    const char* unix_socket_path;
    int tcp_port;
    int http_port;
    pool_check_fn_t pool_check_fn;
    pool_alive_fn_t pool_alive_fn;
    size_t n_pools;
    int eval_timeout;
} daemon_config_t;

// JSON-RPC style methods accepted by the daemon.
typedef enum {
    DAEMON_CALL,
    DAEMON_DISCOVER,
    DAEMON_HEALTH,
    DAEMON_EVAL,
    DAEMON_TYPECHECK,
    DAEMON_BIND,
    DAEMON_BINDINGS,
    DAEMON_UNBIND
} daemon_method_t;

// Parsed daemon request; unused fields are NULL depending on method.
typedef struct daemon_request_s {
    char* id;
    daemon_method_t method;
    char* command;
    char* args_json;
    char* expr;
    char* name;
} daemon_request_t;

// Daemon reply; exactly one of result_json/error is meaningful per `success`.
typedef struct daemon_response_s {
    char* id;
    bool success;
    char* result_json;
    char* error;
} daemon_response_t;

// -- HTTP types --

typedef enum { HTTP_GET, HTTP_POST, HTTP_DELETE, HTTP_OPTIONS } http_method_t;

// Minimal parsed HTTP request (path is truncated to 255 chars + NUL).
typedef struct http_request_s {
    http_method_t method;
    char path[256];
    char* body;
    size_t body_len;
} http_request_t;

// -- Router types --

// One program managed by the router, with its daemon process and socket.
typedef struct router_program_s {
    char* name;
    char* manifest_path;
    manifest_t* manifest;
    pid_t daemon_pid;
    // sized to the platform's sockaddr_un path capacity
    char daemon_socket[sizeof(((struct sockaddr_un*)0)->sun_path)];
} router_program_t;

typedef struct router_s {
    router_program_t* programs;
    size_t n_programs;
    char* fdb_path;
} router_t;

// ========================================================================
// Section 8: Pool types
// ========================================================================

// Dispatch callback: run manifest id `mid` on `args`, returning a packet.
typedef uint8_t* (*pool_dispatch_fn_t)(
    uint32_t mid,
    const uint8_t** args,
    size_t nargs,
    void* ctx
);

typedef enum { POOL_THREADS, POOL_FORK, POOL_SINGLE } pool_concurrency_t;

// Static configuration for a language pool's worker model.
typedef struct {
    pool_dispatch_fn_t local_dispatch;
    pool_dispatch_fn_t remote_dispatch;
    void* dispatch_ctx;
    pool_concurrency_t concurrency;
    int initial_workers;
    bool dynamic_scaling;
    void (*post_fork_child)(void* ctx);
} pool_config_t;

typedef struct pool_state_s pool_state_t;

// ========================================================================
// Section 9: Arrow types
// ========================================================================

// Standard Arrow C data interface structs (see the Arrow spec); guarded so
// they coexist with an external nanoarrow/arrow header.
#ifndef ARROW_C_DATA_INTERFACE
#define ARROW_C_DATA_INTERFACE

struct ArrowSchema {
    const char* format;
    const char* name;
    const char* metadata;
    int64_t flags;
    int64_t n_children;
    struct ArrowSchema** children;
    struct ArrowSchema* dictionary;
    void (*release)(struct ArrowSchema*);
    void* private_data;
};

struct ArrowArray {
    int64_t length;
    int64_t null_count;
    int64_t offset;
    int64_t n_buffers;
    int64_t n_children;
    const void** buffers;
    struct ArrowArray** children;
    struct ArrowArray* dictionary;
    void (*release)(struct ArrowArray*);
    void* private_data;
};

#endif // ARROW_C_DATA_INTERFACE

#define ARROW_SHM_MAGIC 0xA770DA7A
#define ARROW_BUFFER_ALIGN 64
// Round x up to the next multiple of ARROW_BUFFER_ALIGN.
#define ARROW_ALIGN_UP(x) (((x) + ARROW_BUFFER_ALIGN - 1) & ~((size_t)ARROW_BUFFER_ALIGN - 1))

// Per-column descriptor inside the shared-memory Arrow layout.
typedef struct arrow_column_desc {
    morloc_serial_type type;
    uint64_t length;
    uint64_t null_count;
    uint32_t name_offset;
    uint16_t name_length;
    uint64_t data_offset;
    uint64_t data_size;
} arrow_column_desc_t;

// Header preceding columnar data in shared memory; magic = ARROW_SHM_MAGIC.
typedef struct arrow_shm_header {
    uint32_t magic;
    uint32_t n_columns;
    uint64_t n_rows;
    uint64_t total_size;
} arrow_shm_header_t;

// ========================================================================
// Section 10: Slurm / resource types
// ========================================================================

#define MAX_SLURM_COMMAND_LENGTH 1024

// Resource request for a remote (Slurm) call.
typedef struct resources_s {
    int memory;  // in GB
    int time;    // walltime in seconds
    int cpus;
    int gpus;
} resources_t;

// ========================================================================
// Section 11: Function declarations -- Memory / SHM
// ========================================================================

shm_t* shinit(const char* shm_basename, size_t volume_index, size_t shm_size, ERRMSG);
shm_t* shopen(size_t volume_index, ERRMSG);
bool shclose(ERRMSG);
void shm_set_fallback_dir(const char* dir);
void* shmalloc(size_t size, ERRMSG);
void* shmemcpy(void* src, size_t size, ERRMSG);
bool shfree(absptr_t ptr, ERRMSG);
bool shincref(absptr_t ptr, ERRMSG);
bool shfree_by_schema(absptr_t ptr, const Schema* schema, ERRMSG);
void* shcalloc(size_t nmemb, size_t size, ERRMSG);
void* shrealloc(void* ptr, size_t size, ERRMSG);
size_t total_shm_size(void);

// Pointer-space conversions between relative, volume and absolute pointers.
volptr_t rel2vol(relptr_t ptr, ERRMSG);
absptr_t rel2abs(relptr_t ptr, ERRMSG);
// Convenience: resolve a relptr, using base_ptr if available (no SHM lookup needed).
static inline void* resolve_relptr(relptr_t relptr, const void* base_ptr, ERRMSG) {
    if (base_ptr) {
        // Fast path: offset from the caller-supplied base (const is cast away;
        // callers are expected to own the underlying buffer).
        return (char*)base_ptr + relptr;
    }
    return rel2abs(relptr, errmsg_);
}

relptr_t vol2rel(volptr_t ptr, shm_t* shm);
absptr_t vol2abs(volptr_t ptr, shm_t* shm);
relptr_t abs2rel(absptr_t ptr, ERRMSG);
shm_t* abs2shm(absptr_t ptr, ERRMSG);
block_header_t* abs2blk(void* ptr, ERRMSG);

// ========================================================================
// Section 12: Function declarations -- Schema
// ========================================================================

Schema* parse_schema(const char* schema, ERRMSG);
char* schema_to_string(const Schema* schema);
void* get_ptr(const Schema* schema, ERRMSG);
void free_schema(Schema* schema);
bool schema_is_fixed_width(const Schema* schema);
size_t schema_alignment(const Schema* schema);
size_t calculate_voidstar_size(const void* data, const Schema* schema, ERRMSG);

// Inline helpers used by language extensions (pymorloc.c, rmorloc.c)
// Round x up to the next multiple of `align` (align must be a power of two).
#define ALIGN_UP(x, align) (((x) + (align) - 1) & ~((size_t)(align) - 1))

// Number of dimensions of a tensor schema; 0 for NULL/empty schemas.
static inline size_t schema_tensor_ndim(const Schema* schema) {
    if (schema == NULL || schema->size == 0) return 0;
    // ndim is stored in offsets[0] for tensor schemas
    return schema->offsets ? schema->offsets[0] : 0;
}

// ========================================================================
// Section 13: Function declarations -- Serialisation (pack/unpack)
// ========================================================================

int pack(const void* mlc, const char* schema_str, char** mpkptr, size_t* mpk_size, ERRMSG);
int pack_with_schema(const void* mlc, const Schema* schema, char** mpkptr, size_t* mpk_size, ERRMSG);
int unpack_with_schema(const char* mpk, size_t mpk_size, const Schema* schema, void** mlcptr, ERRMSG);

// ========================================================================
// Section 14: Function declarations -- Packets
// ========================================================================

morloc_packet_header_t* read_morloc_packet_header(const uint8_t* msg, ERRMSG);
bool packet_is_ping(const uint8_t* packet, ERRMSG);
bool packet_is_local_call(const uint8_t* packet, ERRMSG);
bool packet_is_remote_call(const uint8_t* packet, ERRMSG);
size_t morloc_packet_size_from_header(const morloc_packet_header_t* header);
size_t morloc_packet_size(const uint8_t* packet, ERRMSG);
uint8_t* return_ping(const uint8_t* packet, ERRMSG);
uint8_t* make_ping_packet(void);

// Packet constructors for the different payload encodings.
uint8_t* make_standard_data_packet(relptr_t ptr, const Schema* schema);
uint8_t* make_arrow_data_packet(relptr_t ptr, const Schema* schema);
uint8_t* make_mpk_data_packet(const char* mpk_filename, const Schema* schema);
uint8_t* make_data_packet_from_mpk(const char* mpk, size_t mpk_size, const Schema* schema);
int get_data_packet_as_mpk(const uint8_t* packet, const Schema* schema, char** mpk_out, size_t* mpk_size_out, ERRMSG);
char* read_schema_from_packet_meta(const uint8_t* packet, ERRMSG);
uint8_t* make_fail_packet(const char* failure_message);
char* get_morloc_data_packet_error_message(const uint8_t* data, ERRMSG);
uint8_t* get_morloc_data_packet_value(const uint8_t* data, const Schema* schema, ERRMSG);
uint8_t* make_morloc_local_call_packet(uint32_t midx, const uint8_t** arg_packets, size_t nargs, ERRMSG);
uint8_t* make_morloc_remote_call_packet(uint32_t midx, const uint8_t** arg_packets, size_t nargs, ERRMSG);
morloc_call_t* read_morloc_call_packet(const uint8_t* packet, ERRMSG);
void free_morloc_call(morloc_call_t* call);
int print_morloc_data_packet(const uint8_t* packet, const Schema* schema, ERRMSG);
int flatten_voidstar_to_buffer(const void* data, const Schema* schema, uint8_t** out_buf, size_t* out_size, ERRMSG);
uint8_t* make_data_packet_auto(void* voidstar, relptr_t relptr, const Schema* schema, ERRMSG);
int adjust_voidstar_relptrs(void* data, const Schema* schema, relptr_t base_rel, ERRMSG);
void* read_voidstar_binary(const uint8_t* blob, size_t blob_size, const Schema* schema, ERRMSG);
bool parse_morloc_call_arguments(uint8_t* packet, uint8_t** args, size_t* nargs, ERRMSG);
bool hash_morloc_packet(const uint8_t* packet, const Schema* schema, uint64_t seed, uint64_t* hash, ERRMSG);

// ========================================================================
// Section 15: Function declarations -- Printing / output
// ========================================================================

char* quoted(const char* input);
bool print_voidstar(const void* voidstar, const Schema* schema, ERRMSG);
bool pretty_print_voidstar(const void* voidstar, const Schema* schema, ERRMSG);
bool print_arrow_as_json(const void* data, ERRMSG);
bool print_arrow_as_table(const void* data, ERRMSG);
bool print_hex_dump(const uint8_t* data, size_t size, ERRMSG);
char* voidstar_to_json_string(const void* voidstar, const Schema* schema, ERRMSG);

// ========================================================================
// Section 16: Function declarations -- Daemon / socket communication
// ========================================================================

void close_socket(int socket_id);
void close_daemon(language_daemon_t** daemon_ptr);
language_daemon_t* start_daemon(
    const char* socket_path,
    const char* tmpdir,
    const char* shm_basename,
    size_t shm_default_size,
    ERRMSG);
uint8_t* stream_from_client_wait(int client_fd, int pselect_timeout_us, int recv_timeout_us, ERRMSG);
uint8_t* stream_from_client(int client_fd, ERRMSG);
uint8_t* send_and_receive_over_socket_wait(
    const char* socket_path,
    const uint8_t* packet,
    int pselect_timeout_us,
    int recv_timeout_us,
    ERRMSG);
uint8_t* send_and_receive_over_socket(const char* socket_path, const uint8_t* packet, ERRMSG);
size_t send_packet_to_foreign_server(int client_fd, uint8_t* packet, ERRMSG);
int wait_for_client_with_timeout(language_daemon_t* daemon, int timeout_us, ERRMSG);
int wait_for_client(language_daemon_t* daemon, ERRMSG);

// Daemon event loop and dispatch.
void daemon_run(daemon_config_t* config, manifest_t* manifest, morloc_socket_t* sockets, size_t n_pools, const char* shm_basename);
daemon_response_t* daemon_dispatch(manifest_t* manifest, daemon_request_t* request, morloc_socket_t* sockets, const char* shm_basename);
daemon_request_t* daemon_parse_request(const char* json, size_t len, ERRMSG);
daemon_response_t* daemon_parse_response(const char* json, size_t len, ERRMSG);
char* daemon_serialize_response(daemon_response_t* response, size_t* out_len);
char* daemon_build_discovery(manifest_t* manifest);
void daemon_set_eval_timeout(int timeout_sec);
void daemon_free_request(daemon_request_t* req);
void daemon_free_response(daemon_response_t* resp);

// Binding store (public types only; internal hash table functions are Rust-side).
binding_store_t* binding_store_init(const char* base_dir);
void binding_store_free(binding_store_t* store);

// ========================================================================
// Section 17: Function declarations -- HTTP
// ========================================================================

http_request_t* http_parse_request(int fd, ERRMSG);
bool http_write_response(int fd, int status, const char* content_type, const char* body, size_t body_len);
daemon_request_t* http_to_daemon_request(http_request_t* req, ERRMSG);
void http_free_request(http_request_t* req);

// ========================================================================
// Section 18: Function declarations -- Router
// ========================================================================

router_t* router_init(const char* fdb_path, ERRMSG);
void router_run(daemon_config_t* config, router_t* router);
bool router_start_program(router_program_t* prog, ERRMSG);
daemon_response_t* router_forward(router_t* router, const char* program, daemon_request_t* request, ERRMSG);
char* router_build_discovery(router_t* router);
void router_free(router_t* router);

// ========================================================================
// Section 19: Function declarations -- Pool
// ========================================================================

int pool_main(int argc, char** argv, pool_config_t* config);
uint8_t* pool_dispatch_packet(
    const uint8_t* packet,
    pool_dispatch_fn_t local_dispatch,
    pool_dispatch_fn_t remote_dispatch,
    void* ctx);
void pool_mark_busy(void);
void pool_mark_idle(void);

// ========================================================================
// Section 20: Function declarations -- Arrow
// ========================================================================

size_t arrow_element_size(morloc_serial_type type);
const char* arrow_format_string(morloc_serial_type type);
morloc_serial_type arrow_format_to_type(const char* format);
relptr_t arrow_to_shm(const struct ArrowArray* array, const struct ArrowSchema* schema, ERRMSG);
int arrow_validate(const arrow_shm_header_t* header, const Schema* schema, ERRMSG);
const void* arrow_column_data(const arrow_shm_header_t* header, uint32_t col_index);
const arrow_column_desc_t* arrow_column_desc(const arrow_shm_header_t* header, uint32_t col_index);
const char* arrow_column_name(const arrow_shm_header_t* header, uint32_t col_index);
int arrow_from_shm(const arrow_shm_header_t* header, struct ArrowSchema* out_schema, struct ArrowArray* out_array, ERRMSG);

// ========================================================================
// Section 21: Function declarations -- Cache
// ========================================================================

char* put_cache_packet(const uint8_t* voidstar, const Schema* schema, uint64_t key, const char* cache_path, ERRMSG);
uint8_t* get_cache_packet(uint64_t key, const char* cache_path, ERRMSG);
bool del_cache_packet(uint64_t key, const char* cache_path, ERRMSG);
char* check_cache_packet(uint64_t key, const char* cache_path, ERRMSG);

// ========================================================================
// Section 22: Function declarations -- CLI / argument parsing
// ========================================================================

argument_t* initialize_positional(char* value);
argument_t* initialize_unrolled(size_t size, char* default_value, char** fields, char** default_fields);
void free_argument_t(argument_t* arg);
uint8_t* parse_cli_data_argument(uint8_t* dest, const argument_t* arg, const Schema* schema, ERRMSG);
uint8_t* make_call_packet_from_cli(
    uint8_t* dest,
    uint32_t mid,
    argument_t** args,
    char** arg_schema_strs,
    ERRMSG);
void* load_morloc_data_file(const char* path, uint8_t* data, size_t data_size, const Schema* schema, ERRMSG);

// ========================================================================
// Section 23: Function declarations -- Expression evaluation
// ========================================================================

morloc_expression_t* make_morloc_bound_var(const char* schema_str, char* varname, ERRMSG);
morloc_expression_t* make_morloc_literal(const char* schema_str, primitive_t lit, ERRMSG);
morloc_expression_t* make_morloc_pattern(const char* schema_str, morloc_pattern_t* pattern, ERRMSG);
morloc_pattern_t* make_morloc_pattern_end(void);
absptr_t morloc_eval(
    morloc_expression_t* expr,
    Schema* return_schema,
    uint8_t** arg_voidstar,
    Schema** arg_schemas,
    size_t nargs,
    ERRMSG);

// ========================================================================
// Section 24: Function declarations -- Manifest
// ========================================================================

manifest_t* parse_manifest(const char* text, ERRMSG);
manifest_t* read_manifest(const char* path, ERRMSG);
void free_manifest(manifest_t* manifest);
morloc_expression_t* build_manifest_expr(const char* json_str, ERRMSG);
char* manifest_to_discovery_json(const manifest_t* manifest);

// ========================================================================
// Section 25: Function declarations -- Intrinsics
// ========================================================================

int mlc_save(const absptr_t data, const Schema* schema, const char* path, ERRMSG);
int mlc_save_json(const absptr_t data, const Schema* schema, const char* path, ERRMSG);
int mlc_save_voidstar(const absptr_t data, const Schema* schema, const char* path, ERRMSG);
void* mlc_load(const char* path, const Schema* schema, ERRMSG);
char* mlc_hash(const absptr_t data, const Schema* schema, ERRMSG);
char* mlc_show(const absptr_t data, const Schema* schema, ERRMSG);
void* mlc_read(const char* json_str, const Schema* schema, ERRMSG);
relptr_t write_voidstar_binary(int fd, const void* data, const Schema* schema, ERRMSG);

// ========================================================================
// Section 26: Function declarations -- Slurm
// ========================================================================

size_t parse_slurm_time(const char* time_str, ERRMSG);
char* write_slurm_time(int seconds);
bool slurm_job_is_complete(uint32_t job_id);
uint32_t submit_morloc_slurm_job(
    const char* nexus_path,
    const char* socket_basename,
    const char* call_packet_filename,
    const char* result_cache_filename,
    const char* output_filename,
    const char* error_filename,
    const resources_t* resources,
    ERRMSG);
uint8_t* remote_call(
    int midx,
    const char* socket_basename,
    const char* cache_path,
    const resources_t* resources,
    const uint8_t** arg_packets,
    size_t nargs,
    ERRMSG);

// ========================================================================
// Section 27: Function declarations -- Utility
// ========================================================================

void hex(const void* ptr, size_t size);
bool file_exists(const char* filename);
int mkdir_p(const char* path, ERRMSG);
void delete_directory(const char* path);
bool has_suffix(const char* x, const char* suffix);
int write_atomic(const char* filename, const uint8_t* data, size_t size, ERRMSG);
int write_binary_fd(int fd, const char* buf, size_t count, ERRMSG);
int print_binary(const char* buf, size_t count, ERRMSG);
uint8_t* read_binary_fd(FILE* file, size_t* file_size, ERRMSG);
uint8_t* read_binary_file(const char* filename, size_t* file_size, ERRMSG);

// ========================================================================
// Section 28: Function declarations -- Hashing
// ========================================================================

uint64_t morloc_xxh64(const void* input, size_t length, uint64_t seed);

// ========================================================================
// Section 29: Function declarations -- JSON reader
// ========================================================================

uint8_t* read_json_with_schema(uint8_t* voidstar, char* json_data, const Schema* schema, ERRMSG);

#ifdef __cplusplus
}
#endif

#endif // 
__MORLOC_H__ ================================================ FILE: data/rust/.gitignore ================================================ target/ ================================================ FILE: data/rust/Cargo.toml ================================================ [workspace] members = ["morloc-manifest", "morloc-runtime", "morloc-nexus", "morloc-manager"] resolver = "2" [workspace.dependencies] libc = "0.2" serde = { version = "1", features = ["derive"] } serde_json = "1" rmp-serde = "1" twox-hash = "2" nix = { version = "0.29", features = ["signal", "socket", "mman", "process", "fs"] } clap = { version = "4", features = ["derive"] } thiserror = "2" [profile.release] opt-level = 2 lto = "thin" ================================================ FILE: data/rust/morloc-manager/Cargo.toml ================================================ [package] name = "morloc-manager" version = "0.23.1" edition = "2021" description = "Container lifecycle manager for Morloc" [[bin]] name = "morloc-manager" path = "src/main.rs" [dependencies] serde = { workspace = true } serde_json = { workspace = true } nix = { version = "0.29", features = ["signal", "socket", "mman", "process", "fs", "user"] } clap = { workspace = true } thiserror = { workspace = true } sha2 = "0.10" chrono = { version = "0.4", features = ["serde"] } dirs = "6" [dev-dependencies] tempfile = "3" ================================================ FILE: data/rust/morloc-manager/src/config.rs ================================================ use std::fs; use std::os::unix::fs::{OpenOptionsExt, PermissionsExt}; use std::path::{Path, PathBuf}; use std::process::Command as StdCommand; use crate::error::{ManagerError, Result}; use crate::types::*; // ====================================================================== // Path utilities // ====================================================================== pub fn config_dir(scope: Scope) -> PathBuf { match scope { Scope::Local => dirs::config_dir() .unwrap_or_else(|| 
PathBuf::from("~/.config"))
            .join("morloc"),
        Scope::System => PathBuf::from("/etc/morloc"),
    }
}

/// Path of the top-level `config.json` for a scope.
pub fn config_path(scope: Scope) -> PathBuf {
    config_dir(scope).join("config.json")
}

/// Data directory for a scope (XDG data dir locally, /usr/local/share system-wide).
pub fn data_dir(scope: Scope) -> PathBuf {
    match scope {
        Scope::Local => dirs::data_dir()
            .unwrap_or_else(|| PathBuf::from("~/.local/share"))
            .join("morloc"),
        Scope::System => PathBuf::from("/usr/local/share/morloc"),
    }
}

// Environment paths

pub fn env_config_dir(scope: Scope, name: &str) -> PathBuf {
    config_dir(scope).join("environments").join(name)
}

pub fn env_config_path(scope: Scope, name: &str) -> PathBuf {
    env_config_dir(scope, name).join("env.json")
}

pub fn env_dockerfile_path(scope: Scope, name: &str) -> PathBuf {
    env_config_dir(scope, name).join("Dockerfile")
}

pub fn env_flags_path(scope: Scope, name: &str) -> PathBuf {
    env_config_dir(scope, name).join("env.flags")
}

pub fn env_data_dir(scope: Scope, name: &str) -> PathBuf {
    data_dir(scope).join("environments").join(name)
}

// ======================================================================
// Reading configuration
// ======================================================================

/// Read and deserialize a JSON config file.
///
/// Maps a permission error to `ConfigPermissionDenied`, any other read
/// failure to `ConfigNotFound`, and a bad JSON body to `ConfigParseError`.
///
/// FIX(review): the extracted source had the generic parameters stripped
/// (`-> Result`, `read_config::()`); the `<T>` form is reconstructed from
/// the call sites -- confirm bounds against upstream.
pub fn read_config<T: serde::de::DeserializeOwned>(path: &Path) -> Result<T> {
    let bytes = fs::read(path).map_err(|e| {
        if e.kind() == std::io::ErrorKind::PermissionDenied {
            ManagerError::ConfigPermissionDenied(path.display().to_string())
        } else {
            ManagerError::ConfigNotFound(path.display().to_string())
        }
    })?;
    serde_json::from_slice(&bytes).map_err(|e| ManagerError::ConfigParseError {
        path: path.display().to_string(),
        msg: e.to_string(),
    })
}

/// Read the active configuration: local scope wins over system scope.
pub fn read_active_config() -> Option<Config> {
    let local_path = config_path(Scope::Local);
    if let Ok(cfg) = read_config::<Config>(&local_path) {
        return Some(cfg);
    }
    let system_path = config_path(Scope::System);
    read_config::<Config>(&system_path).ok()
}

/// Read one environment's `env.json`.
pub fn read_env_config(scope: Scope, name: &str) -> Result<EnvironmentConfig> {
    read_config(&env_config_path(scope, name))
}

// ======================================================================
// Writing configuration
// ======================================================================

/// Serialize `val` as JSON and write it atomically (temp file + rename),
/// guarded by an exclusive lock on `<path>.lock`.
pub fn write_config<T: serde::Serialize>(path: &Path, val: &T) -> Result<()> {
    let dir = path.parent().unwrap();
    fs::create_dir_all(dir).map_err(|e| ManagerError::ConfigParseError {
        path: path.display().to_string(),
        msg: e.to_string(),
    })?;
    best_effort_chmod(dir, 0o755);
    let lock_path = format!("{}.lock", path.display());
    with_file_lock(&lock_path, || {
        // Atomic write: temp file then rename
        let tmp_path = path.with_extension("tmp");
        let json = serde_json::to_vec(val).map_err(|e| ManagerError::ConfigParseError {
            path: path.display().to_string(),
            msg: e.to_string(),
        })?;
        fs::write(&tmp_path, &json).map_err(|e| ManagerError::ConfigParseError {
            path: path.display().to_string(),
            msg: e.to_string(),
        })?;
        fs::rename(&tmp_path, path).map_err(|e| ManagerError::ConfigParseError {
            path: path.display().to_string(),
            msg: e.to_string(),
        })?;
        best_effort_chmod(path, 0o644);
        Ok(())
    })
}

/// Write one environment's `env.json`.
pub fn write_env_config(scope: Scope, name: &str, ec: &EnvironmentConfig) -> Result<()> {
    write_config(&env_config_path(scope, name), ec)
}

// ======================================================================
// Scope utilities
// ======================================================================

/// Find which scope an environment lives in. Checks local first, then system.
pub fn find_env_scope(name: &str) -> Result<Scope> {
    let local_path = env_config_path(Scope::Local, name);
    if local_path.is_file() {
        return Ok(Scope::Local);
    }
    let sys_path = env_config_path(Scope::System, name);
    if sys_path.is_file() {
        return Ok(Scope::System);
    }
    Err(ManagerError::EnvironmentNotFound(name.to_string()))
}

/// List environment names in a given scope.
pub fn list_env_names(scope: Scope) -> Vec<String> {
    let env_dir = config_dir(scope).join("environments");
    if !env_dir.is_dir() {
        return Vec::new();
    }
    let Ok(entries) = fs::read_dir(&env_dir) else {
        return Vec::new();
    };
    entries
        .filter_map(|e| e.ok())
        .filter(|e| e.path().join("env.json").is_file())
        .filter_map(|e| e.file_name().into_string().ok())
        .collect()
}

// ======================================================================
// Flags files
// ======================================================================

/// Read a flags file, skipping blanks/comments and shell-expanding each line.
pub fn read_flags_file(path: &Path) -> Vec<String> {
    let Ok(contents) = fs::read_to_string(path) else {
        return Vec::new();
    };
    contents
        .lines()
        .map(|line| line.trim())
        .filter(|line| !line.is_empty() && !line.starts_with('#'))
        .flat_map(shell_expand_line)
        .collect()
}

/// Expand a single flagfile line through the shell, getting glob expansion,
/// environment variable expansion, tilde expansion, and quote handling.
/// Falls back to simple whitespace splitting if the shell invocation fails.
fn shell_expand_line(line: &str) -> Vec<String> {
    let output = StdCommand::new("sh")
        .args(["-c", &format!("printf '%s\\0' {}", line)])
        .output();
    match output {
        Ok(out) if out.status.success() => {
            let stdout = String::from_utf8_lossy(&out.stdout);
            let tokens: Vec<String> = stdout
                .split('\0')
                .filter(|s| !s.is_empty())
                .map(|s| s.to_string())
                .collect();
            if tokens.is_empty() {
                line.split_whitespace().map(|s| s.to_string()).collect()
            } else {
                tokens
            }
        }
        _ => line.split_whitespace().map(|s| s.to_string()).collect(),
    }
}

/// Read flags file preserving one line per entry (for display).
pub fn read_flags_file_lines(path: &Path) -> Vec<String> {
    let Ok(contents) = fs::read_to_string(path) else {
        return Vec::new();
    };
    contents
        .lines()
        .map(|line| line.trim())
        .filter(|line| !line.is_empty() && !line.starts_with('#'))
        .map(|s| s.to_string())
        .collect()
}

// ======================================================================
// File locking
// ======================================================================

/// Run `action` while holding an exclusive flock on `lock_path`.
/// The lock is released when the `Flock` handle is dropped.
fn with_file_lock<T, F>(lock_path: &str, action: F) -> Result<T>
where
    F: FnOnce() -> Result<T>,
{
    if let Some(parent) = Path::new(lock_path).parent() {
        let _ = fs::create_dir_all(parent);
    }
    let file = std::fs::OpenOptions::new()
        .write(true)
        .create(true)
        .truncate(false)
        .mode(0o644)
        .open(lock_path)
        .map_err(|e| {
            if e.kind() == std::io::ErrorKind::PermissionDenied {
                ManagerError::ConfigPermissionDenied(format!(
                    "{}. Use sudo for system-scope operations",
                    lock_path
                ))
            } else {
                ManagerError::ConfigParseError {
                    path: lock_path.to_string(),
                    msg: format!("Failed to open lock file: {e}"),
                }
            }
        })?;
    use nix::fcntl::FlockArg;
    let locked = nix::fcntl::Flock::lock(file, FlockArg::LockExclusive).map_err(
        |(_file, errno)| ManagerError::ConfigParseError {
            path: lock_path.to_string(),
            msg: format!("Failed to acquire lock: {errno}"),
        },
    )?;
    let result = action();
    // Lock is released when Flock is dropped
    drop(locked);
    result
}

// ======================================================================
// Internal
// ======================================================================

/// Chmod that ignores failures (e.g. on foreign filesystems).
fn best_effort_chmod(path: &Path, mode: u32) {
    let _ = fs::set_permissions(path, fs::Permissions::from_mode(mode));
}

================================================
FILE: data/rust/morloc-manager/src/container.rs
================================================
use std::io;
use std::process::{Command, ExitStatus, Stdio};

use crate::types::ContainerEngine;

// ======================================================================
// Configuration records
// 
====================================================================== #[derive(Debug, Clone)] pub struct RunConfig { pub image: String, pub bind_mounts: Vec<(String, String)>, pub ports: Vec<(u16, u16)>, pub env: Vec<(String, String)>, pub read_only: bool, pub interactive: bool, pub remove_after: bool, pub name: Option, pub shm_size: Option, pub command: Option>, pub work_dir: Option, pub selinux_suffix: String, pub extra_flags: Vec, } impl RunConfig { pub fn new(image: &str) -> Self { Self { image: image.to_string(), bind_mounts: Vec::new(), ports: Vec::new(), env: Vec::new(), read_only: false, interactive: false, remove_after: true, name: None, shm_size: None, command: None, work_dir: None, selinux_suffix: String::new(), extra_flags: Vec::new(), } } } #[derive(Debug, Clone)] pub struct BuildConfig { pub dockerfile: String, pub context: String, pub tag: String, pub build_args: Vec<(String, String)>, } // ====================================================================== // Engine detection // ====================================================================== pub fn engine_executable(engine: ContainerEngine) -> &'static str { match engine { ContainerEngine::Docker => "docker", ContainerEngine::Podman => "podman", } } // ====================================================================== // Operations // ====================================================================== pub fn container_run(engine: ContainerEngine, cfg: &RunConfig) -> (ExitStatus, String, String) { let exe = engine_executable(engine); let extra = engine_specific_run_flags_io(engine); let args = build_run_args(engine, &extra, cfg); run_process(exe, &args) } /// Like `container_run` but captures both stdout and stderr (no streaming). 
pub fn container_run_quiet(engine: ContainerEngine, cfg: &RunConfig) -> (ExitStatus, String, String) { let exe = engine_executable(engine); let extra = engine_specific_run_flags_io(engine); let args = build_run_args(engine, &extra, cfg); run_process_quiet(exe, &args) } pub fn container_run_passthrough( engine: ContainerEngine, verbose: bool, shell: bool, cfg: &RunConfig, ) -> ExitStatus { let exe = engine_executable(engine); let extra = engine_specific_run_flags_io(engine); let args = build_run_args(engine, &extra, cfg); if verbose || shell { let quoted: Vec = args .iter() .map(|a| { if a.contains(' ') { format!("'{a}'") } else { a.clone() } }) .collect(); eprintln!("[morloc-manager] {exe} {}", quoted.join(" ")); } Command::new(exe) .args(&args) .stdin(Stdio::inherit()) .stdout(Stdio::inherit()) .stderr(Stdio::inherit()) .status() .unwrap_or_else(|_| std::process::exit(1)) } pub fn container_build(engine: ContainerEngine, cfg: &BuildConfig) -> (ExitStatus, String, String) { let exe = engine_executable(engine); let args = build_build_args(cfg); run_process(exe, &args) } pub fn container_pull(engine: ContainerEngine, image: &str) -> (ExitStatus, String, String) { let exe = engine_executable(engine); run_process(exe, &["pull".to_string(), image.to_string()]) } /// Build a container image with all output (stdout+stderr) redirected to stderr. /// Use for IO () commands where stdout must stay clean. pub fn container_build_visible(engine: ContainerEngine, cfg: &BuildConfig) -> ExitStatus { let exe = engine_executable(engine); let args = build_build_args(cfg); run_process_to_stderr(exe, &args) } /// Pull a container image with all output (stdout+stderr) redirected to stderr. /// Use for IO () commands where stdout must stay clean. 
pub fn container_pull_visible(engine: ContainerEngine, image: &str) -> ExitStatus { let exe = engine_executable(engine); run_process_to_stderr(exe, &["pull".to_string(), image.to_string()]) } pub fn image_exists_locally(engine: ContainerEngine, image: &str) -> bool { let exe = engine_executable(engine); Command::new(exe) .args(["image", "inspect", image]) .stdout(Stdio::null()) .stderr(Stdio::null()) .status() .map(|s| s.success()) .unwrap_or(false) } /// Run `image inspect` and return the stderr if it fails. /// Returns None on success, Some(stderr) on failure. pub fn image_inspect_stderr(engine: ContainerEngine, image: &str) -> Option { let exe = engine_executable(engine); let output = Command::new(exe) .args(["image", "inspect", image]) .stdout(Stdio::null()) .output() .ok()?; if output.status.success() { None } else { Some(String::from_utf8_lossy(&output.stderr).to_string()) } } /// Result of checking whether a remote image exists. pub enum RemoteImageStatus { /// The image exists on the registry. Exists, /// The registry was reached but the image/tag was not found. NotFound, /// The check failed for an unknown reason (network, auth, etc). /// Contains the stderr output from the container engine. Unknown(String), } pub fn check_remote_image(engine: ContainerEngine, image: &str) -> RemoteImageStatus { let exe = engine_executable(engine); let output = Command::new(exe) .args(["manifest", "inspect", image]) .stdout(Stdio::null()) .output(); match output { Ok(o) if o.status.success() => RemoteImageStatus::Exists, Ok(o) => { let stderr = String::from_utf8_lossy(&o.stderr).to_string(); let lower = stderr.to_lowercase(); // "manifest unknown" / "not found" / "name unknown" indicate // the registry was reachable but the image doesn't exist. 
if lower.contains("manifest unknown") || lower.contains("not found") || lower.contains("name unknown") { RemoteImageStatus::NotFound } else { RemoteImageStatus::Unknown(stderr) } } Err(e) => RemoteImageStatus::Unknown(format!("Failed to execute {exe}: {e}")), } } pub fn container_stop(engine: ContainerEngine, name_or_id: &str) -> (ExitStatus, String) { let exe = engine_executable(engine); let (code, _, err) = run_process(exe, &["stop".to_string(), name_or_id.to_string()]); (code, err) } pub fn container_remove(engine: ContainerEngine, name_or_id: &str) -> ExitStatus { let exe = engine_executable(engine); let (code, _, _) = run_process(exe, &["rm".to_string(), "-f".to_string(), name_or_id.to_string()]); code } /// Quiet container removal: suppresses stderr (for pre-emptive cleanup). pub fn container_remove_quiet(engine: ContainerEngine, name_or_id: &str) -> ExitStatus { let exe = engine_executable(engine); let (code, _, _) = run_process_quiet(exe, &["rm".to_string(), "-f".to_string(), name_or_id.to_string()]); code } /// Check whether a container with this name exists (running or stopped). 
pub fn container_exists(engine: ContainerEngine, name: &str) -> bool { let exe = engine_executable(engine); Command::new(exe) .args(["container", "inspect", name]) .stdout(Stdio::null()) .stderr(Stdio::null()) .status() .map(|s| s.success()) .unwrap_or(false) } pub fn remove_image(engine: ContainerEngine, tag: &str) -> bool { let exe = engine_executable(engine); let (status, _, _) = run_process(exe, &["rmi".to_string(), tag.to_string()]); status.success() } // ====================================================================== // CLI argument construction // ====================================================================== pub fn build_run_args( engine: ContainerEngine, extra_engine_flags: &[String], cfg: &RunConfig, ) -> Vec { let mut args = vec!["run".to_string()]; args.extend(extra_engine_flags.iter().cloned()); if cfg.remove_after { args.push("--rm".to_string()); } if cfg.read_only { args.push("--read-only".to_string()); // Docker does not auto-mount a tmpfs at /tmp when --read-only is used // (podman does). Pool daemons need a writable /tmp for temp files. if engine == ContainerEngine::Docker { args.push("--tmpfs".to_string()); args.push("/tmp".to_string()); } } // Always attach stdin so piped input works; only allocate a TTY for // interactive (shell) sessions. 
args.push("-i".to_string()); if cfg.interactive { args.push("-t".to_string()); } if let Some(ref n) = cfg.name { args.push("--name".to_string()); args.push(n.clone()); } if let Some(ref s) = cfg.shm_size { args.push("--shm-size".to_string()); args.push(s.clone()); } if let Some(ref w) = cfg.work_dir { args.push("-w".to_string()); args.push(w.clone()); } for (host, container) in &cfg.bind_mounts { args.push("-v".to_string()); args.push(format!("{host}:{container}{}", cfg.selinux_suffix)); } for (host_port, container_port) in &cfg.ports { args.push("-p".to_string()); args.push(format!("{host_port}:{container_port}")); } for (key, val) in &cfg.env { args.push("-e".to_string()); args.push(format!("{key}={val}")); } args.extend(cfg.extra_flags.iter().cloned()); args.push(cfg.image.clone()); if let Some(ref cmd) = cfg.command { args.extend(cmd.iter().cloned()); } args } pub fn engine_specific_run_flags_io(engine: ContainerEngine) -> Vec { let uid = nix::unistd::getuid(); match engine { ContainerEngine::Podman => { if uid.is_root() { Vec::new() } else { vec!["--userns=keep-id".to_string()] } } ContainerEngine::Docker => { if uid.is_root() { Vec::new() } else { let gid = nix::unistd::getgid(); vec!["--user".to_string(), format!("{}:{}", uid, gid)] } } } } /// Pure version for testing. 
#[cfg(test)] pub fn engine_specific_run_flags(engine: ContainerEngine) -> Vec { match engine { ContainerEngine::Podman => vec!["--userns=keep-id".to_string()], ContainerEngine::Docker => Vec::new(), } } pub fn build_build_args(cfg: &BuildConfig) -> Vec { let mut args = vec![ "build".to_string(), "-f".to_string(), cfg.dockerfile.clone(), "-t".to_string(), cfg.tag.clone(), ]; for (key, val) in &cfg.build_args { args.push("--build-arg".to_string()); args.push(format!("{key}={val}")); } args.push(cfg.context.clone()); args } // ====================================================================== // Process execution // ====================================================================== /// Run a process with both stdout and stderr redirected to our stderr. /// Returns only the exit status. Use for IO () commands where morloc-manager's /// stdout must stay clean but the user should see all container output. fn run_process_to_stderr(exe: &str, args: &[String]) -> ExitStatus { let mut child = Command::new(exe) .args(args) .stdin(Stdio::null()) .stdout(Stdio::piped()) .stderr(Stdio::inherit()) .spawn() .unwrap_or_else(|e| { eprintln!("Failed to execute {exe}: {e}"); std::process::exit(1); }); // Pump child stdout -> our stderr if let Some(mut child_stdout) = child.stdout.take() { let stderr = io::stderr(); let _ = io::copy(&mut child_stdout, &mut stderr.lock()); } child.wait().unwrap_or_else(|e| { eprintln!("Failed to wait for {exe}: {e}"); std::process::exit(1); }) } /// Run a process with stderr streamed live to the terminal. /// Returns (exit_status, captured_stdout, ""). 
fn run_process(exe: &str, args: &[String]) -> (ExitStatus, String, String) { let output = Command::new(exe) .args(args) .stdin(Stdio::null()) .stdout(Stdio::piped()) .stderr(Stdio::inherit()) .output() .unwrap_or_else(|e| { eprintln!("Failed to execute {exe}: {e}"); std::process::exit(1); }); ( output.status, String::from_utf8_lossy(&output.stdout).to_string(), String::new(), ) } /// Run a process with all output captured (no streaming). /// Used when stderr must be parsed (e.g., for error classification). fn run_process_quiet(exe: &str, args: &[String]) -> (ExitStatus, String, String) { let output = Command::new(exe) .args(args) .stdin(Stdio::null()) .output() .unwrap_or_else(|e| { eprintln!("Failed to execute {exe}: {e}"); std::process::exit(1); }); ( output.status, String::from_utf8_lossy(&output.stdout).to_string(), String::from_utf8_lossy(&output.stderr).to_string(), ) } // ====================================================================== // Helpers // ====================================================================== pub fn exit_code_to_int(status: ExitStatus) -> i32 { status.code().unwrap_or(1) } ================================================ FILE: data/rust/morloc-manager/src/doctor.rs ================================================ use std::fs; use std::path::Path; use std::process::Command; use crate::config as cfg; use crate::container::{container_run_quiet, engine_executable, image_exists_locally, RunConfig}; use crate::environment; use crate::error::Result; use crate::types::*; const MANIFEST_MARKER: &str = "### MANIFEST ###"; #[derive(serde::Serialize)] pub struct CheckResult { pub category: String, pub result: String, pub message: String, } #[derive(serde::Serialize)] pub struct DoctorSummary { pub ok: u32, pub warnings: u32, pub errors: u32, } struct Counts { ok: u32, warn: u32, fail: u32, json_mode: bool, current_category: String, checks: Vec, } impl Counts { fn new(json_mode: bool) -> Self { Self { ok: 0, warn: 0, fail: 0, json_mode, 
current_category: String::new(), checks: Vec::new() } } fn set_category(&mut self, cat: &str) { self.current_category = cat.to_string(); } fn pass(&mut self, msg: &str) { self.ok += 1; if self.json_mode { self.checks.push(CheckResult { category: self.current_category.clone(), result: "ok".to_string(), message: msg.to_string(), }); } else { println!(" [ok] {msg}"); } } fn warn(&mut self, msg: &str) { self.warn += 1; if self.json_mode { self.checks.push(CheckResult { category: self.current_category.clone(), result: "warning".to_string(), message: msg.to_string(), }); } else { println!(" [!!] {msg}"); } } fn fail(&mut self, msg: &str) { self.fail += 1; if self.json_mode { self.checks.push(CheckResult { category: self.current_category.clone(), result: "error".to_string(), message: msg.to_string(), }); } else { println!(" [EE] {msg}"); } } fn skip(&mut self, msg: &str) { if self.json_mode { self.checks.push(CheckResult { category: self.current_category.clone(), result: "skipped".to_string(), message: msg.to_string(), }); } else { println!(" [--] {msg}"); } } } pub fn doctor( engine: ContainerEngine, verbose: bool, env_name: &str, scope: Scope, ec: &EnvironmentConfig, deep: bool, strict: bool, json_mode: bool, ) -> Result<()> { let scope_str = match scope { Scope::Local => "local", Scope::System => "system", }; let engine_str = match engine { ContainerEngine::Docker => "docker", ContainerEngine::Podman => "podman", }; if !json_mode { println!("Environment: {env_name} ({scope_str})"); println!("Engine: {engine_str}"); println!(); } let mut c = Counts::new(json_mode); let data_dir = cfg::env_data_dir(scope, env_name); // ==== Prerequisites ==== if !json_mode { println!("Prerequisites"); } c.set_category("prerequisites"); check_engine(&mut c, engine); check_base_image(&mut c, engine, &ec.base_image); check_built_image(&mut c, engine, ec, scope, env_name); check_data_dirs(&mut c, &data_dir); check_file_readability(&mut c, &data_dir); // ==== Manifests ==== if !json_mode { 
println!("\nManifests"); } c.set_category("manifests"); check_manifests(&mut c, &data_dir, ec.morloc_version.as_ref()); // ==== Deep checks ==== c.set_category("deep"); if deep { if !json_mode { println!("\nDeep checks"); } check_morloc_version(&mut c, engine, ec); check_programs_deep(&mut c, engine, verbose, ec, &data_dir); } else { if !json_mode { println!("\nDeep checks"); } c.skip("Use --deep to run container-side checks"); } let fail_count = c.fail; let warn_count = c.warn; if json_mode { #[derive(serde::Serialize)] struct DoctorOutput { environment: String, scope: String, engine: String, checks: Vec, summary: DoctorSummary, } let output = DoctorOutput { environment: env_name.to_string(), scope: scope_str.to_string(), engine: engine_str.to_string(), checks: c.checks, summary: DoctorSummary { ok: c.ok, warnings: warn_count, errors: fail_count }, }; println!("{}", serde_json::to_string_pretty(&output).unwrap()); } else { // ==== Summary ==== println!(); println!( "{} passed, {} warnings, {} errors", c.ok, warn_count, fail_count ); } if fail_count > 0 { return Err(crate::error::ManagerError::DoctorFailed(fail_count)); } if strict && warn_count > 0 { return Err(crate::error::ManagerError::DoctorFailed(warn_count)); } Ok(()) } // ====================================================================== // Individual checks // ====================================================================== fn check_engine(c: &mut Counts, engine: ContainerEngine) { let exe = engine_executable(engine); let fmt = match engine { ContainerEngine::Podman => "{{.Version.Version}}", ContainerEngine::Docker => "{{.ServerVersion}}", }; let output = Command::new(exe) .args(["info", "--format", fmt]) .output(); match output { Ok(o) if o.status.success() => { let ver = String::from_utf8_lossy(&o.stdout).trim().to_string(); if ver.is_empty() { c.pass(&format!("{exe} engine reachable")); } else { c.pass(&format!("{exe} engine reachable ({ver})")); } } Ok(o) => { let err = 
String::from_utf8_lossy(&o.stderr).trim().to_string(); if err.contains("permission denied") || err.contains("Permission denied") { c.fail(&format!("{exe} permission denied -- add user to {exe} group?")); } else { c.fail(&format!("{exe} not reachable: {err}")); } } Err(e) => { c.fail(&format!("{exe} not found: {e}")); } } } fn check_base_image(c: &mut Counts, engine: ContainerEngine, base_image: &str) { if image_exists_locally(engine, base_image) { c.pass(&format!("Base image {base_image}")); } else { c.fail(&format!( "Base image {base_image} not found locally\n \ Run: morloc-manager run -- morloc --version (triggers pull)" )); } } fn check_built_image(c: &mut Counts, engine: ContainerEngine, ec: &EnvironmentConfig, scope: Scope, env_name: &str) { if ec.dockerfile.is_none() { return; } // Check if the Dockerfile file itself still exists let df_path = cfg::env_dockerfile_path(scope, env_name); if !df_path.exists() { c.warn(&format!( "Dockerfile configured but file is missing: {}\n \ Remove stale config or recreate the file, then run: morloc-manager update", df_path.display() )); return; } match &ec.built_image { Some(img) => { if image_exists_locally(engine, img) { c.pass(&format!("Built image {img}")); } else { c.fail(&format!( "Built image {img} not found locally\n \ Run: morloc-manager update" )); } } None => { c.warn("Dockerfile configured but no image built yet\n \ Run: morloc-manager update"); } } } fn check_data_dirs(c: &mut Counts, data_dir: &Path) { let expected = ["lib", "bin", "opt", "fdb", "src/morloc/plane", "exe"]; let mut missing: Vec<&str> = Vec::new(); for dir in &expected { if !data_dir.join(dir).is_dir() { missing.push(dir); } } if missing.is_empty() { c.pass("Data directories intact"); } else { c.fail(&format!( "Missing directories: {}\n \ Run: morloc-manager run -- morloc init -f", missing.join(", ") )); } } /// Walk exe/ and other data subdirectories, warning about files unreadable /// by the current user (which would cause freeze to fail). 
fn check_file_readability(c: &mut Counts, data_dir: &Path) { let dirs_to_check = ["exe", "bin", "lib"]; let mut unreadable: Vec = Vec::new(); for dir in &dirs_to_check { let dir_path = data_dir.join(dir); if dir_path.is_dir() { collect_unreadable(&dir_path, &mut unreadable); } } if unreadable.is_empty() { c.pass("All data files readable"); } else { let shown: Vec<&str> = unreadable.iter().take(5).map(|s| s.as_str()).collect(); let suffix = if unreadable.len() > 5 { format!(" (and {} more)", unreadable.len() - 5) } else { String::new() }; c.fail(&format!( "Unreadable files (freeze will fail): {}{suffix}\n \ Fix with: chmod -R a+rX ", shown.join(", ") )); } } fn collect_unreadable(dir: &Path, out: &mut Vec) { let Ok(entries) = fs::read_dir(dir) else { out.push(dir.display().to_string()); return; }; for entry in entries.flatten() { let path = entry.path(); if path.is_dir() { collect_unreadable(&path, out); } else if fs::File::open(&path).is_err() { out.push(path.display().to_string()); } } } fn check_manifests( c: &mut Counts, data_dir: &Path, expected_version: Option<&Version>, ) { let fdb_dir = data_dir.join("fdb"); if !fdb_dir.is_dir() { c.warn("No fdb/ directory found"); return; } let entries = match fs::read_dir(&fdb_dir) { Ok(e) => e, Err(e) => { c.fail(&format!("Cannot read fdb/: {e}")); return; } }; let mut found_any = false; for entry in entries.flatten() { let name = entry.file_name(); let name_str = name.to_string_lossy(); if !name_str.ends_with(".manifest") { continue; } found_any = true; let prog_name = &name_str[..name_str.len() - ".manifest".len()]; check_one_manifest(c, &entry.path(), prog_name, data_dir, expected_version); } if !found_any { c.warn("No program manifests found in fdb/"); } } fn check_one_manifest( c: &mut Counts, path: &Path, prog_name: &str, data_dir: &Path, expected_version: Option<&Version>, ) { let content = match fs::read_to_string(path) { Ok(s) => s, Err(e) => { c.fail(&format!("{prog_name} -- cannot read manifest: {e}")); return; 
} }; let json_str = if content.starts_with("#!") { if let Some(marker_pos) = content.find(MANIFEST_MARKER) { let after_marker = &content[marker_pos..]; let json_start = after_marker .find('\n') .map(|i| marker_pos + i + 1) .unwrap_or(content.len()); &content[json_start..] } else { c.fail(&format!("{prog_name} -- manifest missing ### MANIFEST ### marker")); return; } } else { content.as_str() }; let manifest: serde_json::Value = match serde_json::from_str(json_str) { Ok(v) => v, Err(e) => { c.fail(&format!("{prog_name} -- invalid manifest JSON: {e}")); return; } }; let mut issues: Vec = Vec::new(); // Check morloc_version let build_ver = manifest .get("build") .and_then(|b| b.get("morloc_version")) .and_then(|v| v.as_str()); if let (Some(build_ver_str), Some(expected)) = (build_ver, expected_version) { let expected_str = expected.show(); if build_ver_str != expected_str { issues.push(format!( "built with {build_ver_str}, expected {expected_str}" )); } } // Check build.path exists let build_path = manifest .get("build") .and_then(|b| b.get("path")) .and_then(|v| v.as_str()); if let Some(bp) = build_path { // Build paths inside containers are /opt/morloc/exe/..., on host they're // under data_dir/exe/... Try the host path first. 
let host_path = data_dir.join("exe").join(prog_name); if !host_path.is_dir() && !Path::new(bp).is_dir() { issues.push("build directory missing".to_string()); } } else { issues.push("no build.path in manifest".to_string()); } // Check pool files exist let pool_count = manifest .get("pools") .and_then(|p| p.as_array()) .map(|a| a.len()) .unwrap_or(0); if pool_count == 0 { issues.push("no pools defined".to_string()); } if issues.is_empty() { let ver_str = build_ver.unwrap_or("unknown"); c.pass(&format!( "{prog_name} -- built with {ver_str}, {pool_count} pools" )); } else { for issue in &issues { c.warn(&format!( "{prog_name} -- {issue}\n \ Recompile: morloc-manager run -- morloc make --install" )); } } } fn check_morloc_version(c: &mut Counts, engine: ContainerEngine, ec: &EnvironmentConfig) { let image = ec.active_image(); match environment::detect_morloc_version(engine, image) { Ok(detected) => { if let Some(ref expected) = ec.morloc_version { if detected == *expected { c.pass(&format!("morloc {} (matches config)", detected.show())); } else { c.warn(&format!( "morloc {} in container, config says {}", detected.show(), expected.show() )); } } else { c.pass(&format!("morloc {} (no version in config to compare)", detected.show())); } } Err(e) => { c.fail(&format!("Cannot run morloc in container: {e}")); } } } fn check_programs_deep( c: &mut Counts, engine: ContainerEngine, verbose: bool, ec: &EnvironmentConfig, data_dir: &Path, ) { let image = ec.active_image(); let mh = "/opt/morloc"; let bind_mounts = vec![(data_dir.to_string_lossy().to_string(), mh.to_string())]; let env = vec![ ("MORLOC_HOME".to_string(), mh.to_string()), ]; // Scan programs from fdb/ to get program names let fdb_dir = format!("{mh}/fdb"); let cfg = RunConfig { command: Some(vec!["ls".to_string(), fdb_dir.clone()]), bind_mounts: bind_mounts.clone(), env: env.clone(), ..RunConfig::new(image) }; let (status, stdout, _) = container_run_quiet(engine, &cfg); if !status.success() { c.fail("Cannot list 
programs in container"); return; } let programs: Vec = stdout .lines() .filter(|l| l.ends_with(".manifest")) .map(|l| { let name = l.strip_suffix(".manifest").unwrap_or(l); ProgramEntry { name: name.to_string(), commands: Vec::new(), } }) .collect(); if programs.is_empty() { c.warn("No programs found in container"); return; } if !c.json_mode { println!("Running smoke tests for {} programs...", programs.len()); } for prog in &programs { let exe_path = format!("{mh}/bin/{}", prog.name); let cfg = RunConfig { command: Some(vec![exe_path.clone(), "--help".to_string()]), bind_mounts: bind_mounts.clone(), env: env.clone(), ..RunConfig::new(image) }; if verbose { let exe = engine_executable(engine); eprintln!("[morloc-manager] {exe} run --rm {image} {exe_path} --help"); } let (status, _, stderr) = container_run_quiet(engine, &cfg); if status.success() { c.pass(&format!("{} -- smoke test passed", prog.name)); } else { let snippet: String = stderr.lines().take(3).collect::>().join("\n "); c.fail(&format!("{} -- smoke test failed: {snippet}", prog.name)); } } } ================================================ FILE: data/rust/morloc-manager/src/environment.rs ================================================ use std::fs; use std::path::{Path, PathBuf}; use std::process::Command; use serde::Serialize; use sha2::{Digest, Sha256}; use crate::config; use crate::container::{ self, check_remote_image, container_build_visible, container_pull_visible, engine_executable, exit_code_to_int, image_exists_locally, BuildConfig, RemoteImageStatus, }; use crate::error::{ManagerError, Result}; use crate::serve; use crate::types::*; // ====================================================================== // Public types // ====================================================================== /// Options for creating or updating an environment. /// For `new` (is_new=true): all Option fields that are None use defaults. /// For `update` (is_new=false): None means keep the existing value. 
pub struct ApplyOptions {
    pub name: String,
    pub scope: Scope,
    pub is_new: bool,
    // (restored type parameters below: they were stripped during extraction;
    // types inferred from usage in apply_environment -- confirm against the
    // CLI layer)
    pub base_image: Option<String>,
    pub original_image: Option<String>,
    pub morloc_version: Option<Version>,
    // Path to a Dockerfile to copy into the environment's config dir.
    pub dockerfile: Option<String>,
    // Include specs ("path" or "src:dest") copied into the build context.
    pub includes: Vec<String>,
    // Path to a file of extra engine flags, one per line.
    pub flagfile: Option<String>,
    pub engine_args: Vec<String>,
    pub engine: Option<ContainerEngine>,
    pub shm_size: Option<String>,
    pub skip_dockerfile_build: bool,
    pub verbose: bool,
}

/// Info returned by list_environments.
#[derive(Serialize)]
pub struct EnvInfo {
    pub name: String,
    // (restored `Option<Version>`: type parameter lost in extraction;
    // matches EnvironmentConfig.morloc_version -- TODO confirm)
    pub morloc_version: Option<Version>,
    pub active: bool,
}

// ======================================================================
// Image resolution
// ======================================================================

const MORLOC_IMAGE_PREFIX: &str = "ghcr.io/morloc-project/morloc/morloc-full";

/// Recognize engine errors that mean "cannot chdir into the current working
/// directory" and rewrite them into a clearer message. This commonly happens
/// when running `sudo -u morloc-manager ...` from a directory
/// that cannot access (e.g., /root or another user's $HOME).
/// Without this hint, the error bubbles up as "Failed to check registry..."
/// which misleads users toward debugging network/auth problems.
/// (restored `Option<String>` return: type parameter lost in extraction)
fn cwd_access_hint(stderr: &str) -> Option<String> {
    let lower = stderr.to_lowercase();
    let looks_like_cwd_denied = (lower.contains("chdir")
        || lower.contains("getwd")
        || lower.contains("current working directory"))
        && (lower.contains("permission denied") || lower.contains("no such file"));
    if looks_like_cwd_denied {
        Some(format!(
            "Cannot change into the current working directory as the target user. \
             Run morloc-manager from a directory the target user can access \
             (for example /tmp or the user's home directory).\nOriginal error: {}",
            stderr.trim()
        ))
    } else {
        None
    }
}

/// Resolve a morloc version string to a registry image reference.
pub fn version_to_image(ver: &Version) -> String { format!("{MORLOC_IMAGE_PREFIX}:{}", ver.show()) }

/// Pull an image by tag from the morloc registry, detect its version, and
/// return (image_ref, version). The tag can be a semver string ("0.77.0"),
/// a named tag ("edge", "nightly"), or any other valid container tag.
pub fn pull_tagged_image(engine: ContainerEngine, tag: &str) -> Result<(String, Version)> {
    let image_ref = format!("{MORLOC_IMAGE_PREFIX}:{tag}");
    // Only hit the network when the image is not already in the local store.
    if !image_exists_locally(engine, &image_ref) {
        // Probe the registry first so "tag does not exist" and "registry
        // unreachable" produce distinct error messages.
        match check_remote_image(engine, &image_ref) {
            RemoteImageStatus::Exists => {}
            RemoteImageStatus::NotFound => {
                return Err(ManagerError::EnvError(format!(
                    "No container image found for tag '{tag}'"
                )));
            }
            RemoteImageStatus::Unknown(stderr) => {
                // Rewrite misleading cwd-permission errors (see cwd_access_hint).
                if let Some(hint) = cwd_access_hint(&stderr) {
                    return Err(ManagerError::EnvError(hint));
                }
                return Err(ManagerError::EnvError(format!(
                    "Failed to check registry for tag '{tag}': {}",
                    stderr.trim()
                )));
            }
        }
        eprintln!("Pulling {image_ref}...");
        let status = container_pull_visible(engine, &image_ref);
        if !status.success() {
            return Err(ManagerError::EngineError {
                engine,
                code: exit_code_to_int(status),
                stderr: "Pull failed (see output above)".to_string(),
            });
        }
    } else {
        eprintln!("Using local copy of {image_ref}");
    }
    let ver = detect_morloc_version(engine, &image_ref)?;
    // Also tag with the detected version so future --version lookups find it
    let versioned_image = version_to_image(&ver);
    if versioned_image != image_ref {
        let exe = engine_executable(engine);
        // Best-effort: tagging failure is deliberately ignored.
        let _ = Command::new(exe)
            .args(["tag", &image_ref, &versioned_image])
            .output();
    }
    Ok((versioned_image, ver))
}

/// Pull the :edge image. Convenience wrapper around pull_tagged_image.
pub fn resolve_latest(engine: ContainerEngine) -> Result<(String, Version)> { pull_tagged_image(engine, "edge") }

/// Pull a specific version image from the morloc registry.
/// (restored `Result<String>` return: type parameter lost in extraction;
/// pull_tagged_image yields (String, Version) and only the image ref is kept)
pub fn pull_version_image(engine: ContainerEngine, ver: &Version) -> Result<String> {
    let (img, _) = pull_tagged_image(engine, &ver.show())?;
    Ok(img)
}

/// Detect the morloc version by running `morloc --version` inside the image.
/// (restored `Result<Version>` return: type parameter lost in extraction;
/// the body parses the output into a Version)
pub fn detect_morloc_version(engine: ContainerEngine, image: &str) -> Result<Version> {
    let exe = engine_executable(engine);
    let output = Command::new(exe)
        .args(["run", "--rm", image, "morloc", "--version"])
        .stdin(std::process::Stdio::null())
        .stdout(std::process::Stdio::piped())
        .stderr(std::process::Stdio::piped())
        .output()
        .map_err(|e| ManagerError::EnvError(format!("Failed to run container: {e}")))?;
    if !output.status.success() {
        return Err(ManagerError::EnvError(format!(
            "Image '{image}' does not have a working morloc binary: {}",
            String::from_utf8_lossy(&output.stderr).trim()
        )));
    }
    let ver_out = String::from_utf8_lossy(&output.stdout).trim().to_string();
    // Output looks like "morloc X.Y.Z"; take the last whitespace-separated
    // token as the version string.
    let ver_str = ver_out.split_whitespace().last().unwrap_or(&ver_out);
    ver_str.parse().map_err(|_| {
        ManagerError::EnvError(format!(
            "Could not parse morloc version from image '{image}' output: {ver_out}"
        ))
    })
}

/// Pull a custom image (not from morloc registry).
pub fn pull_custom_image(engine: ContainerEngine, image: &str) -> Result<()> {
    if image_exists_locally(engine, image) {
        eprintln!("Using local copy of {image}");
        return Ok(());
    }
    eprintln!("Pulling {image}...");
    let status = container_pull_visible(engine, image);
    if !status.success() {
        return Err(ManagerError::EngineError {
            engine,
            code: exit_code_to_int(status),
            stderr: "Pull failed (see output above)".to_string(),
        });
    }
    Ok(())
}

// ======================================================================
// Core operations
// ======================================================================

/// Create or update an environment.
///
/// When `is_new` is true: validates name uniqueness, creates data directories.
/// Validate that an environment name contains only allowed characters.
pub fn validate_env_name(name: &str) -> Result<()> { if name.is_empty() || !name .chars() .all(|c| c.is_alphanumeric() || c == '-' || c == '_' || c == '.') { return Err(ManagerError::EnvError(format!( "Invalid environment name '{name}': must contain only alphanumeric characters, hyphens, underscores, or dots" ))); } Ok(()) } /// Parse an include spec into (resolved_source, destination). /// /// Supports two forms: /// - `path` — copies to cfg_dir/basename(path) /// - `src:dest` — copies src to cfg_dir/dest /// /// Rules for dest: /// - Must be relative (no leading `/`) /// - Cannot contain `..` /// - If dest ends with `/`, src's basename is appended /// /// Source symlinks are resolved via canonicalize(). fn parse_include_spec(spec: &str, cfg_dir: &Path) -> Result<(PathBuf, PathBuf)> { let (src_str, dest_rel) = if let Some(idx) = spec.find(':') { let s = &spec[..idx]; let d = &spec[idx + 1..]; if s.is_empty() || d.is_empty() { return Err(ManagerError::EnvError(format!( "Invalid include spec: '{spec}'" ))); } (s, d.to_string()) } else { let src_path = Path::new(spec); let fname = src_path.file_name().ok_or_else(|| { ManagerError::EnvError(format!("Invalid include path: {spec}")) })?; (spec.as_ref(), fname.to_string_lossy().to_string()) }; // Validate dest constraints if dest_rel.starts_with('/') { return Err(ManagerError::EnvError(format!( "Include destination must be relative, not absolute: '{dest_rel}'" ))); } if dest_rel.contains("..") { return Err(ManagerError::EnvError(format!( "Include destination cannot contain '..': '{dest_rel}'" ))); } // Resolve src (canonicalize follows symlinks, errors if path doesn't exist) let real_src = Path::new(src_str).canonicalize().map_err(|e| { ManagerError::EnvError(format!("Cannot resolve include path '{src_str}': {e}")) })?; // Compute final dest let dest = cfg_dir.join(&dest_rel); let final_dest = if dest_rel.ends_with('/') { dest.join(real_src.file_name().unwrap_or_default()) } else { dest }; Ok((real_src, final_dest)) } 
/// When `is_new` is false: loads existing config, applies overrides. pub fn apply_environment(opts: &ApplyOptions) -> Result<()> { let scope = opts.scope; let name = &opts.name; validate_env_name(name)?; // Load existing config or start fresh let mut ec = if opts.is_new { let cfg_path = config::env_config_path(scope, name); if cfg_path.is_file() { return Err(ManagerError::EnvError(format!( "Environment '{name}' already exists" ))); } // Create data directories let data_dir = config::env_data_dir(scope, name); for sub in &["bin", "lib", "fdb", "include", "opt", "tmp"] { fs::create_dir_all(data_dir.join(sub)).map_err(|e| { ManagerError::EnvError(format!("Failed to create directory: {e}")) })?; } if scope == Scope::System { use std::os::unix::fs::PermissionsExt; let dirs: Vec<_> = std::iter::once(data_dir.clone()) .chain( ["bin", "lib", "fdb", "include", "opt", "tmp"] .iter() .map(|d| data_dir.join(d)), ) .collect(); for d in dirs { let _ = fs::set_permissions(&d, fs::Permissions::from_mode(0o2775)); } } // Start with required fields from opts; the rest will be applied below EnvironmentConfig { name: name.clone(), base_image: opts.base_image.clone().unwrap_or_default(), original_image: None, dockerfile: None, content_hash: None, built_image: None, engine: opts.engine.unwrap_or(ContainerEngine::Podman), shm_size: "512m".to_string(), morloc_version: None, } } else { config::read_env_config(scope, name) .map_err(|_| ManagerError::EnvironmentNotFound(name.to_string()))? }; // Apply overrides if let Some(ref img) = opts.base_image { ec.base_image = img.clone(); } if let Some(ref img) = opts.original_image { ec.original_image = Some(img.clone()); } if let Some(ref ver) = opts.morloc_version { ec.morloc_version = Some(ver.clone()); } if let Some(engine) = opts.engine { ec.engine = engine; } if let Some(ref shm) = opts.shm_size { if !is_valid_shm_size(shm) { return Err(ManagerError::EnvError(format!( "Invalid --shm-size '{shm}'. 
Use format like: 512m, 1g, 2048k"
        )));
    }
    ec.shm_size = shm.clone();
}

// Copy Dockerfile if a new one was provided
let dockerfile_changed = if let Some(ref src) = opts.dockerfile {
    let dest = config::env_dockerfile_path(scope, name);
    // NOTE(review): unwrap assumes env_dockerfile_path always yields a path
    // with a parent component — confirm against config.rs.
    let dest_dir = dest.parent().unwrap();
    fs::create_dir_all(dest_dir).map_err(|e| {
        ManagerError::EnvError(format!("Failed to create config dir: {e}"))
    })?;
    fs::copy(src, &dest).map_err(|e| {
        ManagerError::EnvError(format!("Failed to copy Dockerfile '{}': {e}", src))
    })?;
    // Only the fixed name "Dockerfile" is recorded; the file lives in the
    // env config dir regardless of the source path.
    ec.dockerfile = Some("Dockerfile".to_string());
    true
} else {
    false
};

// Copy included files/directories into build context.
// Supports src:dest syntax (like Docker volume mounts) for explicit placement.
let cfg_dir = config::env_config_dir(scope, name);
fs::create_dir_all(&cfg_dir).map_err(|e| {
    ManagerError::EnvError(format!("Failed to create config dir: {e}"))
})?;
for spec in &opts.includes {
    let (real_src, final_dest) = parse_include_spec(spec, &cfg_dir)?;
    if let Some(parent) = final_dest.parent() {
        fs::create_dir_all(parent).map_err(|e| {
            ManagerError::EnvError(format!("Failed to create directory: {e}"))
        })?;
    }
    if real_src.is_dir() {
        // Directories are copied via `cp -a` (std::fs has no recursive copy).
        let status = Command::new("cp")
            .args(["-a", &real_src.to_string_lossy(), &final_dest.to_string_lossy()])
            .stdin(std::process::Stdio::null())
            .stdout(std::process::Stdio::null())
            .stderr(std::process::Stdio::inherit())
            .status()
            .map_err(|e| ManagerError::EnvError(format!("Failed to copy '{spec}': {e}")))?;
        if !status.success() {
            return Err(ManagerError::EnvError(format!(
                "Failed to copy directory '{spec}'"
            )));
        }
    } else {
        fs::copy(&real_src, &final_dest).map_err(|e| {
            ManagerError::EnvError(format!("Failed to copy '{spec}': {e}"))
        })?;
    }
}

// Write flags file: for new envs or when flagfile is provided, write fresh.
// For updates with only engine_args, append to existing.
let flags_path = config::env_flags_path(scope, name);
if opts.is_new || opts.flagfile.is_some() {
    // NOTE(review): generic parameter appears stripped by extraction here;
    // presumably `Vec<String>` in the true source.
    let mut flag_lines: Vec = Vec::new();
    if let Some(ref src) = opts.flagfile {
        let content = fs::read_to_string(src).map_err(|e| {
            ManagerError::EnvError(format!("Failed to read flagfile '{}': {e}", src))
        })?;
        // Keep only non-empty, non-comment lines from the flagfile.
        flag_lines.extend(
            content
                .lines()
                .map(|l| l.trim().to_string())
                .filter(|l| !l.is_empty() && !l.starts_with('#')),
        );
    }
    flag_lines.extend(opts.engine_args.iter().cloned());
    let flags_content = if flag_lines.is_empty() {
        String::new()
    } else {
        flag_lines.join("\n") + "\n"
    };
    fs::write(&flags_path, &flags_content).map_err(|e| {
        ManagerError::EnvError(format!("Failed to write flags file: {e}"))
    })?;
} else if !opts.engine_args.is_empty() {
    // Append engine_args to existing flags file
    let mut existing = config::read_flags_file_lines(&flags_path);
    existing.extend(opts.engine_args.iter().cloned());
    let flags_content = existing.join("\n") + "\n";
    fs::write(&flags_path, &flags_content).map_err(|e| {
        ManagerError::EnvError(format!("Failed to write flags file: {e}"))
    })?;
}

// Build Dockerfile layer if present and not skipped
let has_dockerfile = ec.dockerfile.is_some();
let should_build = has_dockerfile
    && !opts.skip_dockerfile_build
    && (opts.is_new
        || dockerfile_changed
        || !opts.includes.is_empty()
        || opts.base_image.is_some()
        || opts.engine.is_some()
        // For update with no specific changes, rebuild if Dockerfile exists
        || (!opts.is_new && opts.dockerfile.is_none() && opts.includes.is_empty()));
if should_build {
    let tag = format!("localhost/morloc-env:{name}");
    let df_path = config::env_dockerfile_path(scope, name);
    if df_path.exists() {
        let hash = hash_file(&df_path)?;
        // Skip rebuild when nothing has actually changed: same Dockerfile
        // hash, no new includes, no base-image change, tagged image still
        // present. Without this, `update` with no arguments silently
        // re-runs the full build every time.
        let unchanged = !opts.is_new
            && !dockerfile_changed
            && opts.includes.is_empty()
            && opts.base_image.is_none()
            && ec.content_hash.as_deref() == Some(hash.as_str())
            && ec.built_image.as_ref()
                .map(|img| image_exists_locally(ec.engine, img))
                .unwrap_or(false);
        if unchanged {
            eprintln!("Dockerfile unchanged; skipping rebuild.");
        } else {
            let build_cfg = BuildConfig {
                dockerfile: df_path.to_string_lossy().to_string(),
                context: cfg_dir.to_string_lossy().to_string(),
                tag: tag.clone(),
                build_args: vec![("CONTAINER_BASE".to_string(), ec.base_image.clone())],
            };
            if opts.verbose {
                let exe = engine_executable(ec.engine);
                eprintln!(
                    "[morloc-manager] {exe} build -f {} -t {} {}",
                    build_cfg.dockerfile, build_cfg.tag, build_cfg.context
                );
            }
            let status = container_build_visible(ec.engine, &build_cfg);
            if !status.success() {
                return Err(ManagerError::EngineError {
                    engine: ec.engine,
                    code: exit_code_to_int(status),
                    stderr: "Build failed (see output above)".to_string(),
                });
            }
            ec.built_image = Some(tag);
            ec.content_hash = Some(hash);
        }
    }
}

// Always reconcile the stored morloc version against the actual image.
// - For `new --version 0.77.0-rc.6`, the binary reports "0.77.0" (stack
//   does not expose prerelease tags), so keep the recorded value when
//   major.minor.patch match — the recorded tag is more informative.
// - For `new --image ` or `update --image ...`, nothing was
//   recorded yet, so store the detected version.
// - If the image has no morloc binary (e.g., a bare base image staged
//   for a Dockerfile layer not yet built), silently leave the field
//   unchanged rather than failing the whole operation.
let detect_target = ec.built_image.clone().unwrap_or_else(|| ec.base_image.clone());
if !detect_target.is_empty() {
    if let Ok(detected) = detect_morloc_version(ec.engine, &detect_target) {
        ec.morloc_version = Some(match ec.morloc_version.take() {
            Some(recorded)
                if recorded.major == detected.major
                    && recorded.minor == detected.minor
                    && recorded.patch == detected.patch => recorded,
            _ => detected,
        });
    }
}

// Write environment config
config::write_env_config(scope, name, &ec)?;
Ok(())
}

/// Remove an environment and all its data.
pub fn remove_environment(engine: ContainerEngine, scope: Scope, name: &str) -> Result<()> {
    let ec = config::read_env_config(scope, name)
        .map_err(|_| ManagerError::EnvironmentNotFound(name.to_string()))?;

    // Stop and remove any running serve container for this environment before
    // removing its image. If we skipped this, the serve container would keep
    // running and be unreachable through morloc-manager.
    let serve_name = serve::serve_container_name(name);
    if container::container_exists(engine, &serve_name) {
        // Best-effort: failures here must not block environment removal.
        let _ = container::container_stop(engine, &serve_name);
        let _ = container::container_remove_quiet(engine, &serve_name);
    }

    // Remove built Dockerfile layer image
    if let Some(ref img) = ec.built_image {
        if image_exists_locally(engine, img) {
            container::remove_image(engine, img);
        }
    }

    // Remove config directory
    let cfg_dir = config::env_config_dir(scope, name);
    if cfg_dir.is_dir() {
        let _ = fs::remove_dir_all(&cfg_dir);
    }

    // Remove data directory
    let data_dir = config::env_data_dir(scope, name);
    if data_dir.is_dir() {
        let _ = fs::remove_dir_all(&data_dir);
    }

    // If the active env was this one, clear it in both local and system configs
    for cfg_scope in [Scope::Local, Scope::System] {
        let cfg_path = config::config_path(cfg_scope);
        // NOTE(review): turbofish type stripped by extraction; presumably
        // `read_config::<Config>` in the true source.
        if let Ok(cfg) = config::read_config::(&cfg_path) {
            if cfg.active_env.as_deref() == Some(name) {
                let new_cfg = Config { active_env: None, ..cfg };
                let _ = config::write_config(&cfg_path, &new_cfg);
            }
        }
    }

    Ok(())
}

///
List environments in the given scope.
///
/// One `EnvInfo` is produced per environment whose config can be read;
/// unreadable or corrupt configs are silently skipped. `active_env` marks
/// which entry (if any) is the currently selected environment.
pub fn list_environments(scope: Scope, active_env: Option<&str>) -> Vec<EnvInfo> {
    config::list_env_names(scope)
        .into_iter()
        .filter_map(|env_name| {
            let ec = config::read_env_config(scope, &env_name).ok()?;
            let is_active = active_env == Some(env_name.as_str());
            Some(EnvInfo {
                name: env_name,
                morloc_version: ec.morloc_version,
                active: is_active,
            })
        })
        .collect()
}

/// Select an environment by writing active_env to the given write_scope config.
///
/// Fails if the named environment does not exist in any scope. Existing
/// settings in the target config are preserved; if the target config is
/// unreadable, the system config (or defaults) seeds the write.
pub fn select_environment(name: &str, write_scope: Scope) -> Result<()> {
    // Verify the environment exists somewhere before touching any config.
    config::find_env_scope(name)?;

    let cfg_path = config::config_path(write_scope);
    let base_cfg = match config::read_config::<Config>(&cfg_path) {
        Ok(existing) => existing,
        Err(_) => config::read_config::<Config>(&config::config_path(Scope::System))
            .unwrap_or_default(),
    };
    let updated = Config { active_env: Some(name.to_string()), ..base_cfg };
    config::write_config(&cfg_path, &updated)
}

/// Resolve the active environment. Checks local config first, then system.
/// Returns (name, scope where env config lives, EnvironmentConfig).
pub fn resolve_active_environment() -> Result<(String, Scope, EnvironmentConfig)> {
    let active_name = resolve_active_env_name()?;
    let env_scope = config::find_env_scope(&active_name)?;
    let env_cfg = config::read_env_config(env_scope, &active_name)?;
    Ok((active_name, env_scope, env_cfg))
}

/// Resolve just the active environment name from config.
/// Skips names that don't resolve to an actual environment (e.g., stale
/// entries from old config formats).
fn resolve_active_env_name() -> Result {
    // Local config takes precedence over system config.
    // NOTE(review): turbofish types below appear stripped by extraction;
    // presumably `read_config::<Config>` in the true source.
    if let Ok(cfg) = config::read_config::(&config::config_path(Scope::Local)) {
        if let Some(ref name) = cfg.active_env {
            if config::find_env_scope(name).is_ok() {
                return Ok(name.clone());
            }
        }
    }
    if let Ok(cfg) = config::read_config::(&config::config_path(Scope::System)) {
        if let Some(ref name) = cfg.active_env {
            if config::find_env_scope(name).is_ok() {
                return Ok(name.clone());
            }
        }
    }
    // Check if any environments exist to give a better suggestion
    let local_envs = config::list_env_names(Scope::Local);
    let system_envs = config::list_env_names(Scope::System);
    if local_envs.is_empty() && system_envs.is_empty() {
        Err(ManagerError::NoActiveEnvironment)
    } else {
        // Label each entry with its scope so same-named envs are distinguishable.
        // System envs are flagged with --system to disambiguate in select.
        let mut available: Vec = local_envs
            .iter()
            .map(|n| format!("{n} (local)"))
            .collect();
        available.extend(system_envs.iter().map(|n| format!("{n} (system)")));
        Err(ManagerError::EnvError(format!(
            "No active environment. 
Select one with: morloc-manager select \n\
 Available: {}",
            available.join(", ")
        )))
    }
}

// ======================================================================
// Internal
// ======================================================================

/// Validate a shared-memory size string: plain digits with an optional
/// single b/k/m/g suffix (either case), e.g. "512m", "1g", "2048".
pub fn is_valid_shm_size(s: &str) -> bool {
    if s.is_empty() {
        return false;
    }
    let (digits, suffix) = if s.ends_with(|c: char| "bkmgBKMG".contains(c)) {
        (&s[..s.len() - 1], true)
    } else {
        (s, false)
    };
    // NOTE(review): the final `(suffix || !digits.is_empty())` clause is
    // always true once the leading `!digits.is_empty()` check has passed —
    // the clause (and the `suffix` binding) look redundant.
    !digits.is_empty()
        && digits.chars().all(|c| c.is_ascii_digit())
        && (suffix || !digits.is_empty())
}

/// SHA-256 of a file's contents, rendered as lowercase hex.
fn hash_file(path: &Path) -> Result {
    let contents = fs::read(path).map_err(|e| {
        ManagerError::EnvError(format!("Failed to read file: {e}"))
    })?;
    let digest = Sha256::digest(&contents);
    Ok(hex_encode(&digest))
}

/// Lowercase hex rendering of a byte slice.
fn hex_encode(bytes: &[u8]) -> String {
    bytes.iter().map(|b| format!("{b:02x}")).collect()
}

================================================
FILE: data/rust/morloc-manager/src/error.rs
================================================
use std::fmt;

use thiserror::Error;

use crate::types::{ContainerEngine, Scope, Version};

/// All error conditions surfaced by morloc-manager subcommands.
/// Messages come from `thiserror`'s `#[error]` attributes.
#[derive(Debug, Error, PartialEq, Eq)]
pub enum ManagerError {
    #[error("Configuration not found: {0}")]
    ConfigNotFound(String),
    #[error("Permission denied: {0}")]
    ConfigPermissionDenied(String),
    #[error("Invalid configuration in {path}: {msg}")]
    ConfigParseError { path: String, msg: String },
    #[error("No active environment. Run: morloc-manager new")]
    NoActiveEnvironment,
    #[error("Environment not found: {0}")]
    EnvironmentNotFound(String),
    #[error("Environment error: {0}")]
    EnvError(String),
    #[error("Invalid version: {0}. Expected format: MAJOR.MINOR.PATCH. For named tags like 'edge', use --tag instead.")]
    InvalidVersion(String),
    #[error("No command specified. Use --shell or provide a command after --.")]
    NoCommand,
    #[error("No container engine found. 
Install podman or docker.")]
    EngineNotFound,
    #[error("Container engine ({engine}) failed with exit code {code}:\n{stderr}")]
    EngineError {
        engine: ContainerEngine,
        code: i32,
        stderr: String,
    },
    #[error("Freeze failed: {0}")]
    FreezeError(String),
    #[error("Unfreeze failed: {0}")]
    UnfreezeError(String),
    #[error("SELinux error: {0}")]
    SELinuxError(String),
    #[error("Doctor found {0} error(s)")]
    DoctorFailed(u32),
    // Message depends on which scope's setup is missing.
    #[error("{}", match .0 {
        Scope::Local => "No local configuration found. Run: morloc-manager new",
        Scope::System => "No system configuration found. Run: sudo morloc-manager new --system",
    })]
    SetupNotComplete(Scope),
}

impl fmt::Display for Version {
    fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result {
        write!(f, "{}.{}.{}", self.major, self.minor, self.patch)
    }
}

impl fmt::Display for ContainerEngine {
    fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result {
        match self {
            ContainerEngine::Docker => write!(f, "Docker"),
            ContainerEngine::Podman => write!(f, "Podman"),
        }
    }
}

// NOTE(review): generic parameters appear stripped by extraction; presumably
// `pub type Result<T> = std::result::Result<T, ManagerError>;` in the source.
pub type Result = std::result::Result;

================================================
FILE: data/rust/morloc-manager/src/freeze.rs
================================================
use std::fs;
use std::path::Path;
use std::process::{Command, Stdio};

use chrono::Utc;
use sha2::{Digest, Sha256};

use crate::config;
use crate::error::{ManagerError, Result};
use crate::types::*;

/// Snapshot the installed state under `v_data_dir` into `output_dir` as a
/// tarball plus a JSON freeze manifest. Fails early if no installed
/// programs are found or any file is unreadable.
pub fn freeze_from_dir(
    scope: Scope,
    ver: Version,
    engine: ContainerEngine,
    image: &str,
    v_data_dir: &str,
    output_dir: &str,
    verbose: bool,
) -> Result<()> {
    fs::create_dir_all(output_dir)
        .map_err(|e| ManagerError::FreezeError(format!("Failed to create output dir: {e}")))?;
    if !Path::new(v_data_dir).is_dir() {
        return Err(ManagerError::FreezeError(format!(
            "Data directory does not exist: {v_data_dir}"
        )));
    }
    // Validate programs exist before writing any files
    let modules = scan_modules(&format!("{v_data_dir}/fdb"));
    let programs = scan_programs(&format!("{v_data_dir}/fdb"));
    if programs.is_empty() {
        return
Err(ManagerError::FreezeError(
            "No morloc programs are installed. Compile and install with 'morloc make --install' before freezing.".to_string()
        ));
    }

    // Validate programs work before freezing
    let mh = "/opt/morloc";
    let bind_mounts = vec![(v_data_dir.to_string(), mh.to_string())];
    crate::serve::validate_programs(engine, image, &programs, bind_mounts, verbose)?;

    eprintln!("Freezing installed state from {v_data_dir}...");
    let tar_path = Path::new(output_dir).join("state.tar.gz");
    let tar_path = tar_path.to_string_lossy();
    // Only archive the subdirectories that actually exist.
    let mut tar_dirs: Vec<&str> = Vec::new();
    for dir in &["lib", "fdb", "bin", "exe", "opt", "src"] {
        if Path::new(&format!("{v_data_dir}/{dir}")).is_dir() {
            tar_dirs.push(dir);
        }
    }

    // Pre-flight: verify all files are readable before invoking tar
    for dir in &tar_dirs {
        check_readable_recursive(&Path::new(v_data_dir).join(dir))?;
    }

    let tar_status = Command::new("tar")
        .args(["-czf", &tar_path, "-C", v_data_dir])
        .args(&tar_dirs)
        .stdin(Stdio::null())
        .stdout(Stdio::null())
        .stderr(Stdio::inherit())
        .status()
        .map_err(|e| ManagerError::FreezeError(format!("tar failed: {e}")))?;
    if !tar_status.success() {
        return Err(ManagerError::FreezeError(
            "tar failed (see error output above)".to_string()
        ));
    }
    eprintln!("Created {tar_path}");

    let now = Utc::now();

    // Get base image from the active environment config.
    // Check local config first, then system config for the active env name
    // (mirrors resolve_active_env_name in environment.rs).
    // NOTE(review): generic parameters appear stripped by extraction below;
    // presumably `Option<String>` and `read_config::<Config>` in the source.
    let active_env_name: Option = config::read_active_config()
        .and_then(|c| c.active_env)
        .or_else(|| {
            let sys_path = config::config_path(Scope::System);
            config::read_config::(&sys_path)
                .ok()
                .and_then(|c| c.active_env)
        });
    let (base_img, env_layer) = if let Some(ref env_name) = active_env_name {
        let env_scope = config::find_env_scope(env_name).unwrap_or(scope);
        match config::read_env_config(env_scope, env_name) {
            Ok(ec) => {
                let base = ec.base_image.clone();
                // Capture env layer info if there's a Dockerfile
                let layer = if ec.dockerfile.is_some() {
                    let df_path = config::env_dockerfile_path(env_scope, env_name);
                    if df_path.exists() {
                        let df_contents = fs::read_to_string(&df_path).unwrap_or_default();
                        let content_hash = ec.content_hash.unwrap_or_default();
                        // Use the tagged image reference (not digest) so that
                        // unfreeze can resolve it locally without network access.
                        // Digest references like localhost/morloc-env@sha256:...
                        // cause BuildKit to attempt HTTPS to localhost.
                        let image_tag = ec.built_image.clone();
                        Some(FrozenEnvLayer {
                            name: env_name.to_string(),
                            dockerfile: df_contents,
                            content_hash,
                            image_tag,
                        })
                    } else {
                        None
                    }
                } else {
                    None
                };
                (base, layer)
            }
            // Unreadable env config: record an unknown base, no layer.
            Err(_) => ("unknown".to_string(), None),
        }
    } else {
        ("unknown".to_string(), None)
    };

    let manifest = FreezeManifest {
        morloc_version: ver,
        frozen_at: now,
        modules,
        programs,
        base_image: base_img,
        env_layer,
        env_vars: Vec::new(),
    };
    let manifest_path = Path::new(output_dir).join("freeze-manifest.json");
    let manifest_path = manifest_path.to_string_lossy();
    write_freeze_manifest(&manifest_path, &manifest)?;
    eprintln!("Wrote {manifest_path}");
    eprintln!("Frozen state written to {output_dir}");
    Ok(())
}

/// Serialize a FreezeManifest to JSON at `path`.
pub fn write_freeze_manifest(path: &str, manifest: &FreezeManifest) -> Result<()> {
    let json = serde_json::to_vec(manifest)
        .map_err(|e| ManagerError::FreezeError(format!("JSON encode failed: {e}")))?;
    fs::write(path, json)
        .map_err(|e| ManagerError::FreezeError(format!("Write failed: {e}")))?;
    Ok(())
}

pub fn
read_freeze_manifest(path: &str) -> Result {
    let bytes = fs::read(path).map_err(|e| ManagerError::FreezeError(format!("Read failed: {e}")))?;
    serde_json::from_slice(&bytes)
        .map_err(|e| ManagerError::FreezeError(format!("Invalid manifest: {e}")))
}

// ======================================================================
// Internal: scanning installed state
// ======================================================================

/// Scan `<fdb_dir>` for `*.module` files and build ModuleEntry records
/// (name, optional version, SHA-256 of the raw file). Unreadable or
/// unparsable files are skipped silently.
fn scan_modules(fdb_dir: &str) -> Vec {
    let fdb_path = Path::new(fdb_dir);
    if !fdb_path.is_dir() {
        return Vec::new();
    }
    let Ok(entries) = fs::read_dir(fdb_path) else {
        return Vec::new();
    };
    // Minimal deserialization target: only the fields we record.
    #[derive(serde::Deserialize)]
    struct ModuleStub {
        name: String,
        #[serde(default)]
        version: Option,
    }
    entries
        .flatten()
        .filter(|e| {
            e.file_name()
                .to_string_lossy()
                .ends_with(".module")
        })
        .filter_map(|e| {
            let bytes = fs::read(e.path()).ok()?;
            let stub: ModuleStub = serde_json::from_slice(&bytes).ok()?;
            let digest = Sha256::digest(&bytes);
            let sha256: String = digest.iter().map(|b| format!("{b:02x}")).collect();
            Some(ModuleEntry {
                name: stub.name,
                version: stub.version,
                sha256,
            })
        })
        .collect()
}

/// Scan `<fdb_dir>` for `*.manifest` files; each becomes a ProgramEntry
/// named after the file stem, with its parsed command list.
fn scan_programs(fdb_dir: &str) -> Vec {
    let fdb_path = Path::new(fdb_dir);
    if !fdb_path.is_dir() {
        return Vec::new();
    }
    let Ok(entries) = fs::read_dir(fdb_path) else {
        return Vec::new();
    };
    entries
        .flatten()
        .filter(|e| {
            e.file_name()
                .to_string_lossy()
                .ends_with(".manifest")
        })
        .map(|e| {
            let filename = e.file_name().to_string_lossy().to_string();
            let prog_name = filename.strip_suffix(".manifest").unwrap_or(&filename);
            let commands = parse_manifest_commands(&e.path());
            ProgramEntry {
                name: prog_name.to_string(),
                commands,
            }
        })
        .collect()
}

/// Extract command names from a program manifest JSON; empty on any error.
fn parse_manifest_commands(path: &Path) -> Vec {
    let Ok(bytes) = fs::read(path) else {
        return Vec::new();
    };
    #[derive(serde::Deserialize)]
    struct ManifestStub {
        #[serde(default)]
        commands: Vec,
    }
    #[derive(serde::Deserialize)]
    struct ManifestStubCmd {
        name: String,
    }
    // NOTE(review): turbofish type stripped by extraction; presumably
    // `from_slice::<ManifestStub>` in the true source.
    match serde_json::from_slice::(&bytes) {
        Ok(stub) => stub.commands.into_iter().map(|c| c.name).collect(),
        Err(_) => Vec::new(),
    }
}

/// Walk a directory tree and verify every file is readable by the current user.
fn check_readable_recursive(dir: &Path) -> Result<()> {
    if !dir.is_dir() {
        return Ok(());
    }
    let entries = fs::read_dir(dir).map_err(|e| {
        ManagerError::FreezeError(format!("Cannot read directory {}: {e}", dir.display()))
    })?;
    for entry in entries {
        let entry = entry.map_err(|e| {
            ManagerError::FreezeError(format!(
                "Cannot read entry in {}: {e}",
                dir.display()
            ))
        })?;
        let path = entry.path();
        if path.is_dir() {
            check_readable_recursive(&path)?;
        } else if fs::File::open(&path).is_err() {
            // Readability is probed by actually opening the file.
            return Err(ManagerError::FreezeError(format!(
                "Unreadable file: {}. Fix permissions or remove before freezing.",
                path.display()
            )));
        }
    }
    Ok(())
}

================================================
FILE: data/rust/morloc-manager/src/main.rs
================================================
mod config;
mod container;
mod doctor;
mod environment;
mod error;
mod freeze;
mod selinux;
mod serve;
mod types;

use std::collections::HashSet;
use std::fs;
use std::io::{self, IsTerminal, Write};
use std::process::{Command, ExitCode, Stdio};

use clap::builder::styling::Style;
use clap::{CommandFactory, FromArgMatches, Parser, Subcommand, ValueEnum};

use crate::config as cfg;
use crate::container::{container_run_passthrough, RunConfig};
use crate::error::{ManagerError, Result};
use crate::selinux::{detect_selinux, volume_suffix, SELinuxMode};
use crate::types::*;

// ======================================================================
// CLI types
// ======================================================================

/// Build the clap help template, grouping subcommands into Development and
/// Deployment sections with ANSI bold/underline styling.
fn build_help_template() -> String {
    let b = Style::new().bold().render();
    let bu = Style::new().bold().underline().render();
    let r = "\x1b[0m"; // full ANSI reset
    format!(
        "\
{{name}} - {{about}} {{usage-heading}} {{usage}} {bu}Development{r} {b}setup{r} Configure the default container engine {b}new{r} Build a new morloc
environment {b}run{r} Run a command in the active environment {b}rm{r} Remove a morloc environment {b}ls{r} List morloc environments {b}info{r} Show configuration and installed environments {b}select{r} Select an environment {b}update{r} Rebuild an environment {b}nuke{r} Remove all morloc environments {bu}Deployment{r} {b}start{r} Serve an environment over the network {b}stop{r} Stop a running serve container {b}logs{r} Stream logs from a running serve container {b}freeze{r} Export installed state as a frozen artifact {b}unfreeze{r} Build a portable serve image from frozen state {b}status{r} List running serve containers {b}doctor{r} Check environment health and diagnose issues {bu}Options{r} {{options}}"
    )
}

/// Top-level CLI. `--version` is handled manually (clap's built-in flag is
/// disabled) so the global flags stay clean.
#[derive(Parser)]
#[command(name = "morloc-manager")]
#[command(about = "container lifecycle manager for Morloc")]
#[command(long_about = "Manage containerized Morloc installations, dependency layers, and deployments")]
#[command(disable_version_flag = true)]
#[command(arg_required_else_help = true)]
#[command(hide_possible_values = true)]
struct Cli {
    /// Print container commands to stderr before executing
    #[arg(short, long, global = true)]
    verbose: bool,
    /// Output machine-readable JSON instead of human-readable text
    #[arg(long, global = true)]
    json: bool,
    /// Print version and exit
    #[arg(long)]
    version: bool,
    // NOTE(review): generic stripped by extraction; presumably Option<Cmd>.
    #[command(subcommand)]
    command: Option,
}

#[derive(Subcommand)]
enum Cmd {
    // -- Development --
    /// Configure the default container engine
    #[command(display_order = 0)]
    #[command(after_help = "Examples:\n  morloc-manager setup --engine podman\n  morloc-manager setup --engine docker\n  sudo morloc-manager setup --engine podman --system")]
    Setup {
        /// Container engine: podman or docker
        #[arg(long, value_enum)]
        engine: Option,
        /// Apply to system scope (requires root)
        #[arg(long)]
        system: bool,
    },
    /// Build a new morloc environment
    #[command(display_order = 1)]
    #[command(after_help = "Examples:\n  morloc-manager new\n  morloc-manager new myenv --version
0.73.0\n  morloc-manager new myenv --tag edge\n  morloc-manager new myenv --image ubuntu:22.04 --dockerfile ./Dockerfile\n\nDefault (when --version, --tag, and --image are all omitted): pulls the\n:edge tag from the morloc registry and records the resolved version.\n\nIn non-interactive mode (no TTY), if no name is given, the latest edge\nimage is pulled and the environment is named after the detected morloc\nversion.")]
    New {
        /// Environment name (default: derived from base image version)
        name: Option,
        /// Base image from Docker Hub or a registry
        #[arg(long)]
        image: Option,
        /// Morloc version (MAJOR.MINOR.PATCH, leading 'v' stripped automatically)
        #[arg(long)]
        version: Option,
        /// Container image tag (e.g., 'edge', 'nightly')
        #[arg(long, conflicts_with_all = ["version", "image"])]
        tag: Option,
        /// Dockerfile to layer on top of the base image
        #[arg(long)]
        dockerfile: Option,
        /// Generate a stub Dockerfile for customization
        #[arg(long)]
        dockerfile_stub: bool,
        /// Force overwrite of existing Dockerfile stub
        #[arg(long)]
        force: bool,
        /// Include file/dir in build context; use src:dest for explicit placement (repeatable)
        #[arg(short = 'i', long = "include")]
        include: Vec,
        /// Path to a file with one engine argument per line
        #[arg(long)]
        flagfile: Option,
        /// A single engine flag (may be repeated)
        #[arg(short = 'x', long = "engine-arg", allow_hyphen_values = true)]
        engine_arg: Vec,
        /// Container engine: podman or docker
        #[arg(long, value_enum)]
        engine: Option,
        /// Shared memory size (default: 512m)
        #[arg(long)]
        shm_size: Option,
        /// Create in system scope (requires root)
        #[arg(long)]
        system: bool,
        /// Skip morloc init after creation
        #[arg(long)]
        no_init: bool,
        /// Skip interactive wizard, use defaults for unspecified options
        #[arg(long)]
        non_interactive: bool,
    },
    /// Run a command in the active environment
    #[command(display_order = 2)]
    #[command(after_help = "\
Examples: morloc-manager run -- morloc --version morloc-manager run -- morloc make -o svc svc.loc morloc-manager
run -- morloc install math morloc-manager run --shell Use -- to separate morloc-manager flags from the container command. Without --, flags like --version are interpreted by morloc-manager itself.")]
    Run {
        /// Command to run inside the container
        command: Vec,
        /// Start an interactive shell
        #[arg(long)]
        shell: bool,
        /// Pass environment variable to the container (KEY=VALUE)
        #[arg(short, long = "env")]
        env_vars: Vec,
        /// Read environment variables from a file (one KEY=VALUE per line)
        #[arg(long)]
        env_file: Option,
    },
    /// Remove a morloc environment
    #[command(display_order = 3)]
    #[command(after_help = "Examples:\n  morloc-manager rm myenv\n  sudo morloc-manager rm myenv --system")]
    Rm {
        /// Environment name(s) to remove
        names: Vec,
        /// Remove from system scope (requires root)
        #[arg(long)]
        system: bool,
        /// Remove even if active (deactivates first)
        #[arg(long)]
        force: bool,
    },
    /// Remove all morloc environments
    #[command(display_order = 8)]
    #[command(after_help = "Examples:\n  morloc-manager nuke\n  morloc-manager nuke --yes\n  morloc-manager nuke --images\n  sudo morloc-manager nuke --system\n  sudo morloc-manager nuke --system --images --yes")]
    Nuke {
        /// Remove system-scope environments instead of local (requires root)
        #[arg(long)]
        system: bool,
        /// Also remove base container images
        #[arg(long)]
        images: bool,
        /// Skip confirmation prompt
        #[arg(long)]
        yes: bool,
    },
    /// List morloc environments
    #[command(display_order = 4)]
    #[command(after_help = "Examples:\n  morloc-manager ls\n  morloc-manager ls --system")]
    Ls {
        /// Show only system environments
        #[arg(long)]
        system: bool,
        /// Show only local environments
        #[arg(long)]
        local: bool,
    },
    /// Show configuration and installed environments
    #[command(display_order = 5)]
    #[command(after_help = "Examples:\n  morloc-manager info\n  morloc-manager info myenv")]
    Info {
        /// Environment name (show details for this environment)
        name: Option,
        /// Look up the system-scope environment (when name is shadowed locally)
        #[arg(long)]
        system: bool,
    },
    /// Select an environment
    #[command(display_order = 6)]
    #[command(after_help = "Examples:\n  morloc-manager select myenv\n  sudo morloc-manager select myenv --system")]
    Select {
        /// Environment name
        name: String,
        /// Write to system config instead of local (requires root)
        #[arg(long)]
        system: bool,
    },
    /// Rebuild an environment
    #[command(display_order = 7)]
    #[command(after_help = "Examples:\n  morloc-manager update                    # rebuild active environment\n  morloc-manager update myenv              # rebuild a specific environment\n  morloc-manager update --shm-size 1g\n  morloc-manager update --dockerfile ./new.Dockerfile -i ./data\n  morloc-manager update myenv --reinit     # re-run morloc init in myenv")]
    Update {
        /// Environment name (default: active environment)
        name: Option,
        /// Change the base image
        #[arg(long)]
        image: Option,
        /// Change to a specific morloc version (MAJOR.MINOR.PATCH, leading 'v' stripped)
        #[arg(long)]
        version: Option,
        /// Container image tag (e.g., 'edge', 'nightly')
        #[arg(long, conflicts_with_all = ["version", "image"])]
        tag: Option,
        /// Replace the Dockerfile
        #[arg(long)]
        dockerfile: Option,
        /// Include file/dir in build context; use src:dest for explicit placement (repeatable)
        #[arg(short = 'i', long = "include")]
        include: Vec,
        /// Replace the flags file
        #[arg(long)]
        flagfile: Option,
        /// Add an engine flag (repeatable; appends unless --flagfile replaces)
        #[arg(short = 'x', long = "engine-arg", allow_hyphen_values = true)]
        engine_arg: Vec,
        /// Change the container engine
        #[arg(long, value_enum)]
        engine: Option,
        /// Change shared memory size
        #[arg(long)]
        shm_size: Option,
        /// Generate a stub Dockerfile (fails if one already exists)
        #[arg(long)]
        dockerfile_stub: bool,
        /// Force overwrite of existing Dockerfile stub
        #[arg(long)]
        force: bool,
        /// Skip Dockerfile build
        #[arg(long)]
        no_build: bool,
        /// Re-run morloc init
        #[arg(long)]
        reinit: bool,
        /// Accepted for scripting uniformity with `new` (no effect)
        #[arg(long, hide = true)]
        non_interactive: bool,
    },
    // -- Deployment --
    /// Serve an environment over the network
    #[command(display_order = 20)]
    #[command(after_help = "Examples:\n  morloc-manager start           # serve active environment\n  morloc-manager start myenv -p 9090:8080")]
    Start {
        /// Environment name (default: active environment)
        name: Option,
        /// Port mapping HOST:CONTAINER (default: 8080:8080)
        #[arg(short, long, value_parser = parse_port)]
        port: Vec<(u16, u16)>,
        /// Pass environment variable to the container (KEY=VALUE)
        #[arg(short, long = "env")]
        env_vars: Vec,
        /// Read environment variables from a file (one KEY=VALUE per line)
        #[arg(long)]
        env_file: Option,
        /// Replace an already-running serve container
        #[arg(long)]
        force: bool,
    },
    /// Stop a running serve container
    #[command(display_order = 21)]
    #[command(after_help = "Examples:\n  morloc-manager stop            # stop active environment\n  morloc-manager stop myenv")]
    Stop {
        /// Environment name (default: active environment)
        name: Option,
    },
    /// Stream logs from a running serve container
    #[command(display_order = 22)]
    #[command(after_help = "Examples:\n  morloc-manager logs            # logs from only running serve container\n  morloc-manager logs myenv\n  morloc-manager logs -f myenv   # follow mode")]
    Logs {
        /// Environment name (default: auto-detect running container)
        name: Option,
        /// Follow log output
        #[arg(short, long)]
        follow: bool,
    },
    /// Export installed state as a frozen artifact
    #[command(display_order = 23)]
    #[command(after_help = "Examples:\n  morloc-manager freeze\n  morloc-manager freeze myenv\n  morloc-manager freeze -o ./my-freeze\n\nRequires at least one program compiled with 'morloc make --install'.")]
    Freeze {
        /// Environment name (default: active environment)
        name: Option,
        /// Output directory (default: ./morloc-freeze)
        #[arg(short, long)]
        output: Option,
        /// Overwrite existing output directory
        #[arg(long)]
        force: bool,
    },
    /// Build a serve image from frozen state
    #[command(display_order = 24)]
    #[command(after_help = "Examples:\n  morloc-manager unfreeze --from ./morloc-freeze/state.tar.gz
-t myservice:v1\n  morloc-manager unfreeze --from ./state.tar.gz -t svc:v1 --engine docker")]
    Unfreeze {
        /// Path to state.tar.gz from freeze
        #[arg(long)]
        from: String,
        /// Image tag
        #[arg(short, long)]
        tag: String,
        /// Base image override
        #[arg(long)]
        base: Option,
        /// Container engine override (default: configured engine).
        /// Images frozen with engine-specific flags may not work with a different engine.
        #[arg(long, value_enum)]
        engine: Option,
        /// Rebuild image even if it already exists locally
        #[arg(long)]
        rebuild: bool,
    },
    /// Evaluate a morloc expression against a running serve container
    #[command(display_order = 25)]
    #[command(after_help = "Examples:\n  morloc-manager eval 'add 1 2'\n  morloc-manager eval myenv 'map (add 1) [1,2,3]'\n  morloc-manager eval -p 9090 'greet \"world\"'")]
    Eval {
        /// Expression to evaluate (or environment name if two positional args)
        first: String,
        /// Expression to evaluate (when first arg is environment name)
        second: Option,
        /// Port of the serve container (default: 8080)
        #[arg(short, long, default_value = "8080")]
        port: u16,
    },
    /// List running serve containers
    #[command(display_order = 26)]
    #[command(after_help = "Examples:\n  morloc-manager status")]
    Status,
    /// Check environment health and diagnose issues
    // NOTE(review): display_order = 26 duplicates Status above; clap resolves
    // ties by declaration order, but this looks like an off-by-one (27?).
    #[command(display_order = 26)]
    #[command(after_help = "Examples:\n  morloc-manager doctor\n  morloc-manager doctor myenv\n  morloc-manager doctor --deep")]
    Doctor {
        /// Environment name (default: active)
        name: Option,
        /// Check system-scope environment
        #[arg(long)]
        system: bool,
        /// Run checks inside the container (slower, more thorough)
        #[arg(long)]
        deep: bool,
        /// Treat warnings as errors (non-zero exit on warnings)
        #[arg(long)]
        strict: bool,
    },
}

/// CLI-facing mirror of ContainerEngine for clap's ValueEnum parsing.
#[derive(Clone, ValueEnum)]
enum EngineArg {
    Docker,
    Podman,
}

// NOTE(review): generic stripped by extraction; presumably `From<EngineArg>`.
impl From for ContainerEngine {
    fn from(e: EngineArg) -> Self {
        match e {
            EngineArg::Docker => ContainerEngine::Docker,
            EngineArg::Podman => ContainerEngine::Podman,
        }
    }
}

/// clap value parser for -p/--port: "HOST:CONTAINER" -> (host, container).
fn parse_port(s: &str) -> std::result::Result<(u16,
u16), String> {
    let parts: Vec<&str> = s.splitn(2, ':').collect();
    if parts.len() != 2 {
        return Err(format!("Expected HOST:CONTAINER format, got: {s}"));
    }
    let host: u16 = parts[0]
        .parse()
        .map_err(|_| format!("Invalid host port: {}", parts[0]))?;
    let container: u16 = parts[1]
        .parse()
        .map_err(|_| format!("Invalid container port: {}", parts[1]))?;
    Ok((host, container))
}

/// Parse env vars from --env flags and --env-file, returning (key, value) pairs.
// Flags are appended after file entries, so --env overrides --env-file when
// the consumer keeps the last occurrence of a key.
fn collect_env_vars(
    env_flags: &[String],
    env_file: Option<&str>,
) -> Result> {
    let mut result = Vec::new();
    if let Some(path) = env_file {
        let contents = std::fs::read_to_string(path).map_err(|e| {
            ManagerError::EnvError(format!("Cannot read env file {path}: {e}"))
        })?;
        for line in contents.lines() {
            let trimmed = line.trim();
            if trimmed.is_empty() || trimmed.starts_with('#') {
                continue;
            }
            if let Some((k, v)) = trimmed.split_once('=') {
                result.push((k.to_string(), v.to_string()));
            }
        }
    }
    for entry in env_flags {
        if let Some((k, v)) = entry.split_once('=') {
            result.push((k.to_string(), v.to_string()));
        } else {
            // Bare key — pass through from host environment
            if let Ok(v) = std::env::var(entry) {
                result.push((entry.clone(), v));
            } else {
                eprintln!("Warning: env var '{entry}' not set in host environment, skipping");
            }
        }
    }
    Ok(result)
}

// ======================================================================
// Main
// ======================================================================

fn main() -> ExitCode {
    // Restore default SIGPIPE so piping output to e.g. `head` exits quietly.
    #[cfg(unix)]
    {
        use nix::sys::signal::{signal, SigHandler, Signal};
        unsafe {
            let _ = signal(Signal::SIGPIPE, SigHandler::SigDfl);
        }
    }
    let matches = match Cli::command()
        .help_template(build_help_template())
        .try_get_matches()
    {
        Ok(m) => m,
        Err(e) => {
            // Detect missing -- separator for the run subcommand
            let rendered = e.to_string();
            if rendered.contains("unrecognized") || rendered.contains("unexpected") {
                // NOTE(review): generic stripped; presumably Vec<String>.
                let args: Vec = std::env::args().collect();
                if args.len() > 1 && args[1] == "run" {
                    let inner: Vec<&str>
= args[2..].iter()
                        .filter(|a| *a != "--shell")
                        .map(|a| a.as_str())
                        .collect();
                    if !inner.is_empty() {
                        eprintln!("Error: unrecognized arguments for 'run'.");
                        eprintln!();
                        eprintln!("Use -- to separate morloc-manager flags from the container command:");
                        eprintln!("    morloc-manager run -- {}", inner.join(" "));
                        return ExitCode::from(2);
                    }
                }
            }
            // Any other parse error: let clap print and exit.
            e.exit();
        }
    };
    let cli = Cli::from_arg_matches(&matches).unwrap();
    if cli.version {
        println!("morloc-manager {}", env!("CARGO_PKG_VERSION"));
        return ExitCode::SUCCESS;
    }
    let Some(cmd) = cli.command else {
        // No subcommand: show help and exit with the conventional usage code.
        Cli::command()
            .help_template(build_help_template())
            .print_help()
            .ok();
        return ExitCode::from(2);
    };
    match dispatch(cli.verbose, cli.json, cmd) {
        Ok(()) => ExitCode::SUCCESS,
        Err(err) => {
            if cli.json {
                println!("{}", serde_json::json!({"error": format!("{err}")}));
            } else {
                eprintln!("{err}");
            }
            // Propagate the container engine's own exit code when available.
            if let ManagerError::EngineError { code, .. } = &err {
                ExitCode::from(*code as u8)
            } else {
                ExitCode::FAILURE
            }
        }
    }
}

/// Map the --system flag to a Scope.
fn resolve_scope(system: bool) -> Scope {
    if system { Scope::System } else { Scope::Local }
}

/// Probe write access to the system config dir by creating (and removing)
/// a marker file; returns a permission error suggesting sudo on failure.
fn check_system_write_access() -> Result<()> {
    let sys_dir = cfg::config_dir(Scope::System);
    if sys_dir.exists() {
        let test_path = sys_dir.join(".write-check");
        match fs::write(&test_path, b"") {
            Ok(_) => {
                let _ = fs::remove_file(&test_path);
                Ok(())
            }
            Err(_) => Err(ManagerError::ConfigPermissionDenied(format!(
                "{}. System-scope operations require root. Re-run with sudo",
                sys_dir.display()
            )))
        }
    } else {
        match fs::create_dir_all(&sys_dir) {
            Ok(_) => Ok(()),
            Err(_) => Err(ManagerError::ConfigPermissionDenied(format!(
                "{}. System-scope operations require root. Re-run with sudo",
                sys_dir.display()
            )))
        }
    }
}

/// Resolve an environment by explicit name or fall back to the active environment.
fn resolve_env_or_active(name: Option) -> Result<(String, Scope, EnvironmentConfig)> { match name { Some(n) => { let scope = cfg::find_env_scope(&n)?; let ec = cfg::read_env_config(scope, &n)?; Ok((n, scope, ec)) } None => environment::resolve_active_environment(), } } fn ensure_engine() -> Result { if let Some(cfg) = cfg::read_active_config() { return Ok(cfg.engine); } Err(ManagerError::SetupNotComplete(Scope::Local)) } fn which(name: &str) -> bool { Command::new("which") .arg(name) .stdout(Stdio::null()) .stderr(Stdio::null()) .status() .map(|s| s.success()) .unwrap_or(false) } fn display_engine(engine: ContainerEngine) -> &'static str { match engine { ContainerEngine::Docker => "docker", ContainerEngine::Podman => "podman", } } fn bold_green(msg: &str) -> String { if io::stderr().is_terminal() { format!("\x1b[1;32m{msg}\x1b[0m") } else { msg.to_string() } } fn check_docker_socket(engine: ContainerEngine) { use std::path::Path; if engine != ContainerEngine::Docker { return; } let socket = Path::new("/var/run/docker.sock"); if !socket.exists() { eprintln!("Warning: Docker socket not found at /var/run/docker.sock"); eprintln!(" Docker may not be installed or the daemon may not be running."); } else if nix::unistd::access(socket, nix::unistd::AccessFlags::R_OK).is_err() { eprintln!("Warning: Cannot access Docker socket. You may need to:"); eprintln!(" sudo usermod -aG docker $USER # then log out and back in"); } } /// Returns Err with a clear message if Docker is selected but its socket is unreachable. fn require_docker_socket(engine: ContainerEngine) -> Result<()> { use std::path::Path; if engine != ContainerEngine::Docker { return Ok(()); } let socket = Path::new("/var/run/docker.sock"); if !socket.exists() { return Err(ManagerError::EnvError( "Docker socket not found at /var/run/docker.sock. 
Ensure Docker is installed and the daemon is running.".to_string() )); } if nix::unistd::access(socket, nix::unistd::AccessFlags::R_OK).is_err() { return Err(ManagerError::EnvError( "Cannot access Docker socket. Add your user to the docker group:\n \ sudo usermod -aG docker $USER # then log out and back in".to_string() )); } Ok(()) } /// Check if Podman is configured to see rootful images from rootless contexts. /// Returns true if additionalimagestore is configured (or not needed). fn check_podman_additional_stores(engine: ContainerEngine) -> bool { if engine != ContainerEngine::Podman { return true; } // Root doesn't need additional stores — it owns the store if nix::unistd::getuid().is_root() { return true; } let rootful_store = std::path::Path::new("/var/lib/containers/storage"); if !rootful_store.is_dir() { // No rootful store exists, nothing to configure return true; } // Check system and user storage.conf for additionalimagestores for path in &[ "/etc/containers/storage.conf", &format!( "{}/.config/containers/storage.conf", dirs::home_dir() .unwrap_or_default() .to_string_lossy() ), ] { if let Ok(contents) = fs::read_to_string(path) { if contents.contains("/var/lib/containers/storage") { return true; } } } false } fn warn_podman_additional_stores() { eprintln!("Warning: Podman is not configured to see system (rootful) images."); eprintln!(" Non-root users will not be able to run system environments."); eprintln!(" Option 1 (recommended): Use Docker for system environments."); eprintln!(" Option 2: Add to [storage.options] in /etc/containers/storage.conf:"); eprintln!(); eprintln!(" additionalimagestores = [\"/var/lib/containers/storage\"]"); eprintln!(); eprintln!(" Note: Option 2 may cause storage locking conflicts on Fedora and Debian."); } // ====================================================================== // Dispatch // ====================================================================== fn dispatch(verbose: bool, json: bool, cmd: Cmd) -> 
Result<()> { match cmd { // ---- setup ---- Cmd::Setup { engine, system } => { // With no --engine, show the current engine settings if engine.is_none() { let local = cfg::read_config::(&cfg::config_path(Scope::Local)).ok(); let sys = cfg::read_config::(&cfg::config_path(Scope::System)).ok(); println!("Local engine: {}", local.as_ref().map(|c| display_engine(c.engine)).unwrap_or("unset")); println!("System engine: {}", sys.as_ref().map(|c| display_engine(c.engine)).unwrap_or("unset")); println!(); println!("Set with: morloc-manager setup --engine "); return Ok(()); } if system { check_system_write_access()?; } let scope = resolve_scope(system); let eng: ContainerEngine = engine.unwrap().into(); check_docker_socket(eng); let cfg_path = cfg::config_path(scope); let base_cfg = cfg::read_config::(&cfg_path).unwrap_or_default(); let new_cfg = Config { engine: eng, ..base_cfg }; cfg::write_config(&cfg_path, &new_cfg)?; eprintln!("Engine set to: {}", display_engine(eng)); Ok(()) } // ---- new ---- Cmd::New { name, image, version, tag, dockerfile, dockerfile_stub, force, include, flagfile, engine_arg, engine, shm_size, system, no_init, non_interactive, } => { if system { check_system_write_access()?; } let scope = resolve_scope(system); // Resolve engine: explicit flag > config default > auto-detect single > error // For --system, prefer system config so the env uses the system engine. 
let resolved_engine = if let Some(e) = engine { let eng: ContainerEngine = e.into(); check_docker_socket(eng); eng } else if let Some(cfg) = if system { // System scope: check system config first, then local cfg::read_config::(&cfg::config_path(Scope::System)).ok() .or_else(|| cfg::read_active_config()) } else { cfg::read_active_config() } { cfg.engine } else { // No config — try auto-detection let has_podman = which("podman"); let has_docker = which("docker"); match (has_podman, has_docker) { (true, false) => ContainerEngine::Podman, (false, true) => { check_docker_socket(ContainerEngine::Docker); ContainerEngine::Docker } (true, true) => { let scope_flag = if system { " --system" } else { "" }; return Err(ManagerError::EnvError(format!( "Both podman and docker are installed and no default is set.\n\ Pick one with:\n \ morloc-manager setup --engine podman{scope_flag}\n \ morloc-manager setup --engine docker{scope_flag}\n\ Or pass --engine to this command directly." ))); } (false, false) => return Err(ManagerError::EngineNotFound), } }; // Ensure config exists (write default if first run) if cfg::read_active_config().is_none() { let cfg_path = cfg::config_path(scope); let new_cfg = Config { active_env: None, engine: resolved_engine, }; cfg::write_config(&cfg_path, &new_cfg)?; } let interactive = !non_interactive && io::stdin().is_terminal(); if !non_interactive && !interactive { eprintln!("Note: No TTY detected, running in non-interactive mode."); } // Step 1: Resolve name (ask first so user isn't surprised after a long pull) let env_name = if let Some(n) = name { if cfg::env_config_path(scope, &n).is_file() { return Err(ManagerError::EnvError(format!( "Environment '{n}' already exists" ))); } n } else if interactive { loop { eprint!("Environment name: "); io::stderr().flush().ok(); let mut name_input = String::new(); io::stdin().read_line(&mut name_input).ok(); let n = name_input.trim().to_string(); if n.is_empty() { eprintln!("Name cannot be empty."); continue; } 
if cfg::env_config_path(scope, &n).is_file() { eprintln!("Environment '{n}' already exists. Choose a different name."); continue; } break n; } } else { // Non-interactive without a name: will be filled in after // version resolution below (default to version string) String::new() }; // Validate name early (before potentially slow image pull) if !env_name.is_empty() { environment::validate_env_name(&env_name)?; } if version.is_some() && image.is_some() { return Err(ManagerError::EnvError( "--version and --image are mutually exclusive".to_string() )); } // Validate cheap-to-check parameters before any I/O if let Some(ref shm) = shm_size { if !environment::is_valid_shm_size(shm) { return Err(ManagerError::EnvError(format!( "Invalid --shm-size '{shm}'. Use format like: 512m, 1g, 2048k" ))); } } // Step 2: Resolve base image and version let (base_image, original_image, morloc_ver) = if let Some(ref ver_str) = version { // Strip leading 'v' for convenience (e.g., "v0.77.0" -> "0.77.0") let clean = ver_str.strip_prefix('v').unwrap_or(ver_str); let ver: Version = clean.parse().map_err(|_| { ManagerError::InvalidVersion(ver_str.clone()) })?; let img = environment::pull_version_image(resolved_engine, &ver)?; (img, None, Some(ver)) } else if let Some(ref t) = tag { let (img, ver) = environment::pull_tagged_image(resolved_engine, t)?; (img, None, Some(ver)) } else if let Some(ref img) = image { environment::pull_custom_image(resolved_engine, img)?; (img.clone(), None, None) } else if interactive { eprintln!("Choose a base image:"); eprintln!(" [1] Latest morloc release (recommended)"); eprintln!(" [2] Specific morloc version"); eprintln!(" [3] Custom image"); eprint!("Choose [1]: "); io::stderr().flush().ok(); let mut input = String::new(); io::stdin().read_line(&mut input).ok(); match input.trim() { "2" => { eprint!("Morloc version: "); io::stderr().flush().ok(); let mut ver_input = String::new(); io::stdin().read_line(&mut ver_input).ok(); let ver: Version = 
ver_input.trim().parse().map_err(|_| { ManagerError::InvalidVersion(ver_input.trim().to_string()) })?; let img = environment::pull_version_image(resolved_engine, &ver)?; (img, None, Some(ver)) } "3" => { eprint!("Image reference: "); io::stderr().flush().ok(); let mut img_input = String::new(); io::stdin().read_line(&mut img_input).ok(); let img = img_input.trim().to_string(); if img.is_empty() { return Err(ManagerError::EnvError("No image specified".to_string())); } environment::pull_custom_image(resolved_engine, &img)?; (img, None, None) } _ => { let (img, ver) = environment::resolve_latest(resolved_engine)?; (img.clone(), Some(img), Some(ver)) } } } else { let (img, ver) = environment::resolve_latest(resolved_engine)?; (img.clone(), Some(img), Some(ver)) }; // Fill in name for non-interactive mode if it wasn't provided let env_name = if env_name.is_empty() { if let Some(ref ver) = morloc_ver { let default_name = ver.show(); if cfg::env_config_path(scope, &default_name).is_file() { return Err(ManagerError::EnvError(format!( "Environment '{}' already exists. 
Specify a different name: morloc-manager new ...", default_name ))); } default_name } else { return Err(ManagerError::EnvError( "Environment name required in non-interactive mode".to_string(), )); } } else { env_name }; // Resolve dockerfile: explicit path takes precedence, then stub generation let resolved_dockerfile = if dockerfile.is_some() { if dockerfile_stub { return Err(ManagerError::EnvError( "Cannot use both --dockerfile and --dockerfile-stub".to_string(), )); } dockerfile } else if dockerfile_stub { let df_path = cfg::env_dockerfile_path(scope, &env_name); if df_path.exists() && !force { return Err(ManagerError::EnvError(format!( "Dockerfile already exists: {}\nUse --force to overwrite.", df_path.display() ))); } let stub_dir = cfg::data_dir(scope).join("tmp"); fs::create_dir_all(&stub_dir).map_err(|e| { ManagerError::EnvError(format!("Failed to create tmp dir: {e}")) })?; let stub_path = stub_dir.join(format!("{env_name}.Dockerfile")); let stub_content = format!( "# morloc environment: {env_name}\n\ # Edit this file, then rebuild with: morloc-manager update\n\ \n\ # CONTAINER_BASE is replaced at build time with the environment's base image\n\ ARG CONTAINER_BASE=scratch\n\ FROM ${{CONTAINER_BASE}}\n\ \n\ # Example: install system packages\n\ # RUN apt-get update && apt-get install -y jq && rm -rf /var/lib/apt/lists/*\n\ \n\ # Example: install Python packages\n\ # RUN pip install scikit-learn pandas\n\ \n\ # Example: install R packages\n\ # RUN R -e \"install.packages('ggplot2', repos='https://cloud.r-project.org')\"\n" ); fs::write(&stub_path, &stub_content).map_err(|e| { ManagerError::EnvError(format!("Failed to write stub Dockerfile: {e}")) })?; Some(stub_path.to_string_lossy().to_string()) } else { None }; let opts = environment::ApplyOptions { name: env_name.clone(), scope, is_new: true, base_image: Some(base_image), original_image, morloc_version: morloc_ver, dockerfile: resolved_dockerfile, includes: include, flagfile, engine_args: engine_arg, 
engine: Some(resolved_engine), shm_size: Some(shm_size.unwrap_or_else(|| "512m".to_string())), skip_dockerfile_build: dockerfile_stub, verbose, }; environment::apply_environment(&opts)?; if dockerfile_stub { let df_path = cfg::env_dockerfile_path(scope, &env_name); eprintln!("Stub Dockerfile: {}", df_path.display()); eprintln!("Edit it, then run: morloc-manager update {env_name}"); } eprintln!("Created environment: {env_name}"); // Run morloc init, passing the env explicitly (no active env needed) if !no_init { let ec = cfg::read_env_config(scope, &env_name)?; run_morloc_init_for(Some((env_name.clone(), scope, ec)), verbose)?; } else { eprintln!("Warning: --no-init was used. Run 'morloc-manager run -- morloc init -f' before building morloc programs."); } eprintln!("{}", bold_green(&format!("Environment '{env_name}' is ready."))); eprintln!("Activate it with: morloc-manager select {env_name}"); if system && !check_podman_additional_stores(resolved_engine) { eprintln!(); warn_podman_additional_stores(); } Ok(()) } // ---- run ---- Cmd::Run { command, shell, env_vars, env_file } => { if !shell && command.is_empty() { return Err(ManagerError::NoCommand); } let user_env = collect_env_vars(&env_vars, env_file.as_deref())?; run_in_container(verbose, shell, &command, &user_env).map_err(|e| match e { ManagerError::EnvironmentNotFound(msg) => ManagerError::EnvironmentNotFound( format!("{msg}. 
Run 'morloc-manager new' to create an environment") ), other => other, }) } // ---- rm ---- Cmd::Rm { names, system, force } => { if system { check_system_write_access()?; } if names.is_empty() { return Err(ManagerError::EnvError("No environment names specified".to_string())); } // Capture current active env for post-removal feedback let was_active = cfg::read_active_config().and_then(|c| c.active_env); // Attempt each removal; collect failures, continue past errors let mut failures: Vec = Vec::new(); for name in &names { let result: Result<()> = (|| { let scope = if system { Scope::System } else { cfg::find_env_scope(name)? }; if scope == Scope::System && !system { check_system_write_access()?; } if !force { if let Some(cfg) = cfg::read_active_config() { if cfg.active_env.as_deref() == Some(name.as_str()) { return Err(ManagerError::EnvError(format!( "active environment (use --force)" ))); } } } let ec = cfg::read_env_config(scope, name) .map_err(|_| ManagerError::EnvironmentNotFound(name.to_string()))?; environment::remove_environment(ec.engine, scope, name)?; Ok(()) })(); match result { Ok(()) => { // Check if removed env was active and report new state if was_active.as_deref() == Some(name.as_str()) { match environment::resolve_active_environment() { Ok((new_active, _, _)) => { // Persist the fallback as the new active environment let _ = environment::select_environment(&new_active, Scope::Local); eprintln!("Removed environment: {name}. Active environment is now: {new_active}"); } Err(_) => { eprintln!("Removed environment: {name}. No active environment. 
Use: morloc-manager select "); } } } else { eprintln!("Removed environment: {name}"); } } Err(e) => failures.push(format!("{name}: {e}")), } } if !failures.is_empty() { eprintln!(); eprintln!("Failed to remove {} environment(s):", failures.len()); for f in &failures { eprintln!(" {f}"); } return Err(ManagerError::EnvError(format!( "{} of {} removals failed", failures.len(), names.len() ))); } Ok(()) } // ---- nuke ---- Cmd::Nuke { system, images, yes } => { let scope = if system { Scope::System } else { Scope::Local }; let scope_label = if system { "system" } else { "local" }; if system { check_system_write_access()?; } // Confirm before removing all environments let env_names = cfg::list_env_names(scope); if env_names.is_empty() { eprintln!("No {scope_label} environments found."); return Ok(()); } if !yes { eprintln!("This will remove {} {scope_label} environment(s):", env_names.len()); for n in &env_names { eprintln!(" {n}"); } if io::stdin().is_terminal() { eprint!("Continue? [y/N] "); io::stderr().flush().ok(); let mut answer = String::new(); io::stdin().read_line(&mut answer).ok(); if !matches!(answer.trim(), "y" | "yes" | "Y" | "YES") { eprintln!("Aborted."); return Ok(()); } } else { return Err(ManagerError::EnvError( "nuke requires --yes for non-interactive use".to_string(), )); } } eprintln!("Removing all {scope_label} morloc environments..."); // Collect env info before removal (configs are deleted during removal) let mut env_list: Vec<(String, ContainerEngine)> = Vec::new(); let mut base_images: HashSet = HashSet::new(); for name in cfg::list_env_names(scope) { if let Ok(ec) = cfg::read_env_config(scope, &name) { if images { base_images.insert(ec.base_image.clone()); if let Some(ref orig) = ec.original_image { base_images.insert(orig.clone()); } } env_list.push((name, ec.engine)); } } if env_list.is_empty() { eprintln!("No {scope_label} environments found."); } else { let mut removed = 0usize; let mut failures: Vec = Vec::new(); for (name, engine) in 
&env_list { eprintln!("Removing environment: {name}..."); match environment::remove_environment(*engine, scope, name) { Ok(()) => { eprintln!(" Removed: {name}"); removed += 1; } Err(e) => { eprintln!(" Failed: {name}: {e}"); failures.push(format!("{name}: {e}")); } } } // Clear active_env in the targeted scope's config let cfg_path = cfg::config_path(scope); if let Ok(cfg_data) = cfg::read_config::(&cfg_path) { if cfg_data.active_env.is_some() { let new_cfg = Config { active_env: None, ..cfg_data }; let _ = cfg::write_config(&cfg_path, &new_cfg); eprintln!("Cleared active environment."); } } eprintln!("Removed {removed} environment(s)."); if !failures.is_empty() { eprintln!(); eprintln!("Failed to remove {} environment(s):", failures.len()); for f in &failures { eprintln!(" {f}"); } return Err(ManagerError::EnvError(format!( "{} of {} removals failed", failures.len(), env_list.len() ))); } } // Remove base images if --images if images && !base_images.is_empty() { let engine = ensure_engine().unwrap_or(ContainerEngine::Docker); eprintln!("Removing base images..."); for img in &base_images { if container::image_exists_locally(engine, img) { eprintln!(" Removing image: {img}..."); if container::remove_image(engine, img) { eprintln!(" Removed: {img}"); } else { eprintln!(" Failed to remove: {img}"); } } } } // Hint about the other scope let other_scope = if system { Scope::Local } else { Scope::System }; let other_envs = cfg::list_env_names(other_scope); if !other_envs.is_empty() { if system { eprintln!( "{} local environment(s) remain. Use: morloc-manager nuke", other_envs.len() ); } else { eprintln!( "{} system environment(s) remain. Use: sudo morloc-manager nuke --system", other_envs.len() ); } } Ok(()) } // ---- ls ---- Cmd::Ls { system, local } => { let active_env = cfg::read_active_config() .and_then(|c| c.active_env); let active_str = active_env.as_deref(); // Determine which scope effectively owns the active environment. 
// Local takes priority (same resolution as run/select). let active_in_local = active_str .map(|name| cfg::env_config_path(Scope::Local, name).is_file()) .unwrap_or(false); let show_local = !system || local; let show_system = !local || system; let local_envs = if show_local { let local_active = if active_in_local { active_str } else { None }; environment::list_environments(Scope::Local, local_active) } else { Vec::new() }; let system_envs = if show_system { let system_active = if active_in_local { None } else { active_str }; environment::list_environments(Scope::System, system_active) } else { Vec::new() }; if json { #[derive(serde::Serialize)] struct LsOutput { local: Vec, system: Vec, } let output = LsOutput { local: local_envs, system: system_envs }; println!("{}", serde_json::to_string_pretty(&output).unwrap()); } else { let total = local_envs.len() + system_envs.len(); if !local_envs.is_empty() { println!("Local environments:"); for e in &local_envs { let active_mark = if e.active { " (active)" } else { "" }; let ver_mark = e.morloc_version.as_ref() .map(|v| format!(" [{}]", v.show())) .unwrap_or_default(); println!(" {}{}{}", e.name, ver_mark, active_mark); } } if !system_envs.is_empty() { if !local_envs.is_empty() { println!(); } println!("System environments:"); for e in &system_envs { let active_mark = if e.active { " (active)" } else { "" }; let ver_mark = e.morloc_version.as_ref() .map(|v| format!(" [{}]", v.show())) .unwrap_or_default(); println!(" {}{}{}", e.name, ver_mark, active_mark); } } if total == 0 { println!("No environments found. Create one with: morloc-manager new"); } } Ok(()) } // ---- info ---- Cmd::Info { name, system } => { if let Some(env_name) = name { // Detailed info for a specific environment let scope = if system { if !cfg::env_config_path(Scope::System, &env_name).is_file() { return Err(ManagerError::EnvironmentNotFound(format!( "{env_name} (in system scope)" ))); } Scope::System } else { cfg::find_env_scope(&env_name)? 
}; let ec = cfg::read_env_config(scope, &env_name)?; let data_dir = cfg::env_data_dir(scope, &env_name); let active = cfg::read_active_config() .and_then(|c| c.active_env) .as_deref() == Some(env_name.as_str()); if json { #[derive(serde::Serialize)] struct InfoDetail { name: String, scope: String, active: bool, base_image: String, built_image: Option, morloc_version: Option, engine: String, shm_size: String, dockerfile: Option, flags: Vec, data_dir: String, } let df_str = ec.dockerfile.as_ref().map(|_| { let df_path = cfg::env_dockerfile_path(scope, &env_name); df_path.display().to_string() }); let flags_path = cfg::env_flags_path(scope, &env_name); let flags = cfg::read_flags_file_lines(&flags_path); let output = InfoDetail { name: ec.name.clone(), scope: match scope { Scope::Local => "local", Scope::System => "system" }.to_string(), active, base_image: ec.base_image.clone(), built_image: ec.built_image.clone(), morloc_version: ec.morloc_version.clone(), engine: display_engine(ec.engine).to_string(), shm_size: ec.shm_size.clone(), dockerfile: df_str, flags, data_dir: data_dir.display().to_string(), }; println!("{}", serde_json::to_string_pretty(&output).unwrap()); } else { println!("Name: {}", ec.name); println!("Scope: {}", match scope { Scope::Local => "local", Scope::System => "system" }); println!("Active: {}", if active { "yes" } else { "no" }); println!("Base image: {}", ec.base_image); if let Some(ref img) = ec.built_image { println!("Built image: {img}"); } if let Some(ref ver) = ec.morloc_version { println!("Morloc version: {}", ver.show()); } println!("Engine: {}", display_engine(ec.engine)); println!("SHM size: {}", ec.shm_size); println!("Dockerfile: {}", match ec.dockerfile { Some(_) => { let df_path = cfg::env_dockerfile_path(scope, &env_name); if df_path.exists() { df_path.display().to_string() } else { format!("{} (MISSING)", df_path.display()) } } None => "none".to_string(), }); let flags_path = cfg::env_flags_path(scope, &env_name); 
println!("Flags: {}", flags_path.display()); let flags = cfg::read_flags_file_lines(&flags_path); for flag in &flags { println!(" {flag}"); } println!("Data dir: {}", data_dir.display()); } } else { // Overview let local_cfg = cfg::read_config::(&cfg::config_path(Scope::Local)).ok(); let system_cfg = cfg::read_config::(&cfg::config_path(Scope::System)).ok(); let se_mode = detect_selinux(); let active_env = environment::resolve_active_environment() .map(|(name, _, _)| name) .unwrap_or_else(|_| "none".to_string()); let se_str = match se_mode { SELinuxMode::Enforcing => "enforcing", SELinuxMode::Permissive => "permissive", SELinuxMode::Disabled => "not detected", }; if json { #[derive(serde::Serialize)] struct DirInfo { path: String, exists: bool } #[derive(serde::Serialize)] struct InfoOverview { active: String, local_engine: String, system_engine: String, selinux: String, directories: std::collections::BTreeMap, local: Vec, system: Vec, } let active_str = if active_env == "none" { None } else { Some(active_env.as_str()) }; let mut directories = std::collections::BTreeMap::new(); for (label, path) in [ ("config_local", cfg::config_dir(Scope::Local)), ("data_local", cfg::data_dir(Scope::Local)), ("config_system", cfg::config_dir(Scope::System)), ("data_system", cfg::data_dir(Scope::System)), ] { directories.insert(label.to_string(), DirInfo { path: path.display().to_string(), exists: path.is_dir(), }); } let output = InfoOverview { active: active_env.clone(), local_engine: local_cfg.as_ref().map(|c| display_engine(c.engine)).unwrap_or("unset").to_string(), system_engine: system_cfg.as_ref().map(|c| display_engine(c.engine)).unwrap_or("unset").to_string(), selinux: se_str.to_string(), directories, local: environment::list_environments(Scope::Local, active_str), system: environment::list_environments(Scope::System, active_str), }; println!("{}", serde_json::to_string_pretty(&output).unwrap()); } else { println!("Active: {active_env}"); println!("Local engine: {}", 
local_cfg.as_ref().map(|c| display_engine(c.engine)).unwrap_or("unset")); println!("System engine: {}", system_cfg.as_ref().map(|c| display_engine(c.engine)).unwrap_or("unset")); println!("SELinux: {se_str}"); let dirs = [ ("Config (local)", cfg::config_dir(Scope::Local)), ("Data (local)", cfg::data_dir(Scope::Local)), ("Config (system)", cfg::config_dir(Scope::System)), ("Data (system)", cfg::data_dir(Scope::System)), ]; println!("\nDirectories:"); for (label, path) in &dirs { let status = if path.is_dir() { "exists" } else { "not found" }; println!(" {:<20} {} ({})", label, path.display(), status); } let active_str = if active_env == "none" { None } else { Some(active_env.as_str()) }; // Check if active env lives in local scope (local takes priority) let active_in_local = active_str .map(|name| cfg::env_config_path(Scope::Local, name).is_file()) .unwrap_or(false); let local_envs = environment::list_environments(Scope::Local, active_str); println!("\nLocal environments:"); if local_envs.is_empty() { println!(" (none)"); } else { for e in &local_envs { let active_mark = if e.active { " (active)" } else { "" }; let ver_mark = e.morloc_version.as_ref() .map(|v| format!(" [{}]", v.show())) .unwrap_or_default(); println!(" {}{}{}", e.name, ver_mark, active_mark); } } let system_envs = environment::list_environments(Scope::System, active_str); if !system_envs.is_empty() { println!("\nSystem environments:"); for e in &system_envs { let active_mark = if e.active && active_in_local { " (active - shadowed)" } else if e.active { " (active)" } else { "" }; let ver_mark = e.morloc_version.as_ref() .map(|v| format!(" [{}]", v.show())) .unwrap_or_default(); println!(" {}{}{}", e.name, ver_mark, active_mark); } } } } Ok(()) } // ---- select ---- Cmd::Select { name, system } => { if system { check_system_write_access()?; } let write_scope = resolve_scope(system); environment::select_environment(&name, write_scope)?; if system { eprintln!("Set system default environment: {name}"); 
} else { eprintln!("Selected environment: {name}"); } Ok(()) } // ---- update ---- Cmd::Update { name, image, version, tag, dockerfile, dockerfile_stub, force, include, flagfile, engine_arg, engine, shm_size, no_build, reinit, non_interactive: _, } => { let (env_name, env_scope) = match name { Some(n) => { let scope = cfg::find_env_scope(&n)?; (n, scope) } None => { let (n, s, _) = environment::resolve_active_environment()?; (n, s) } }; if env_scope == Scope::System { check_system_write_access()?; } // Handle --dockerfile-stub: generate stub if no Dockerfile exists let resolved_dockerfile = if dockerfile.is_some() && dockerfile_stub { return Err(ManagerError::EnvError( "Cannot use both --dockerfile and --dockerfile-stub".to_string(), )); } else if dockerfile_stub { let df_path = cfg::env_dockerfile_path(env_scope, &env_name); if df_path.exists() && !force { return Err(ManagerError::EnvError(format!( "Dockerfile already exists: {}\nUse --force to overwrite.", df_path.display() ))); } let stub_dir = cfg::data_dir(env_scope).join("tmp"); fs::create_dir_all(&stub_dir).map_err(|e| { ManagerError::EnvError(format!("Failed to create tmp dir: {e}")) })?; let stub_path = stub_dir.join(format!("{env_name}.Dockerfile")); let stub_content = format!( "# morloc environment: {env_name}\n\ # Edit this file, then rebuild with: morloc-manager update\n\ \n\ # CONTAINER_BASE is replaced at build time with the environment's base image\n\ ARG CONTAINER_BASE=scratch\n\ FROM ${{CONTAINER_BASE}}\n\ \n\ # Example: install system packages\n\ # RUN apt-get update && apt-get install -y jq && rm -rf /var/lib/apt/lists/*\n\ \n\ # Example: install Python packages\n\ # RUN pip install scikit-learn pandas\n\ \n\ # Example: install R packages\n\ # RUN R -e \"install.packages('ggplot2', repos='https://cloud.r-project.org')\"\n" ); fs::write(&stub_path, &stub_content).map_err(|e| { ManagerError::EnvError(format!("Failed to write stub Dockerfile: {e}")) })?; 
Some(stub_path.to_string_lossy().to_string()) } else { dockerfile }; if version.is_some() && image.is_some() { return Err(ManagerError::EnvError( "--version and --image are mutually exclusive".to_string() )); } // Resolve base image if --version, --tag, or --image provided let (base_image, original_image, morloc_ver) = if let Some(ref ver_str) = version { let ec = cfg::read_env_config(env_scope, &env_name)?; let clean = ver_str.strip_prefix('v').unwrap_or(ver_str); let ver: Version = clean.parse().map_err(|_| { ManagerError::InvalidVersion(ver_str.clone()) })?; let img = environment::pull_version_image(ec.engine, &ver)?; (Some(img), None, Some(ver)) } else if let Some(ref t) = tag { let ec = cfg::read_env_config(env_scope, &env_name)?; let (img, ver) = environment::pull_tagged_image(ec.engine, t)?; (Some(img), None, Some(ver)) } else if let Some(ref img) = image { let ec = cfg::read_env_config(env_scope, &env_name)?; environment::pull_custom_image(ec.engine, img)?; // Detect version from the new image so it doesn't stay stale let detected_ver = environment::detect_morloc_version(ec.engine, img).ok(); (Some(img.clone()), None, detected_ver) } else { (None, None, None) }; eprintln!("Updating environment: {env_name}"); let opts = environment::ApplyOptions { name: env_name.clone(), scope: env_scope, is_new: false, base_image, original_image, morloc_version: morloc_ver, dockerfile: resolved_dockerfile, includes: include, flagfile, engine_args: engine_arg, engine: engine.map(|e| e.into()), shm_size, skip_dockerfile_build: no_build || dockerfile_stub, verbose, }; environment::apply_environment(&opts)?; if dockerfile_stub { let df_path = cfg::env_dockerfile_path(env_scope, &env_name); eprintln!("Stub Dockerfile: {}", df_path.display()); eprintln!("Edit it, then run: morloc-manager update {env_name}"); } // --version, --tag, and --image imply --reinit (ABI may have changed) if reinit || version.is_some() || tag.is_some() || image.is_some() { // Re-read the config 
(apply_environment may have updated it) let ec = cfg::read_env_config(env_scope, &env_name)?; // Check for running serve container -- reinit replaces morloc-nexus // which will fail with "Text file busy" if the container has it open. let serve_name = serve::serve_container_name(&env_name); let running = serve::find_running_serve_containers(ec.engine); if running.iter().any(|n| n == &serve_name) { return Err(ManagerError::EnvError(format!( "Cannot reinit environment '{env_name}' while its serve container is running.\n \ Run 'morloc-manager stop {env_name}' first." ))); } run_morloc_init_for(Some((env_name.clone(), env_scope, ec)), verbose)?; } eprintln!("{}", bold_green(&format!("Environment '{env_name}' updated."))); if env_scope == Scope::System && !check_podman_additional_stores( cfg::read_env_config(env_scope, &env_name) .map(|ec| ec.engine) .unwrap_or(ContainerEngine::Podman), ) { eprintln!(); warn_podman_additional_stores(); } Ok(()) } // ---- freeze ---- Cmd::Freeze { name, output, force } => { let output_dir = output.as_deref().unwrap_or("./morloc-freeze"); // Protect against silently overwriting a previous freeze let existing_tar = std::path::Path::new(output_dir).join("state.tar.gz"); if existing_tar.exists() && !force { return Err(ManagerError::FreezeError(format!( "Output directory already contains a freeze: {}\n \ Use --force to overwrite, or specify a different -o path.", existing_tar.display() ))); } let (env_name, env_scope, ec) = resolve_env_or_active(name)?; let engine = ec.engine; // Detect the version from the container binary for sanity check. // The morloc binary can't report prerelease tags (stack limitation), // so if major.minor.patch match, keep the recorded version which has // the full tag from the image. 
eprintln!("Detecting morloc version from image..."); let detected = environment::detect_morloc_version(ec.engine, ec.active_image())?; let ver = if let Some(ref recorded) = ec.morloc_version { if recorded.major == detected.major && recorded.minor == detected.minor && recorded.patch == detected.patch { recorded.clone() } else { eprintln!( "Warning: recorded morloc version ({}) does not match image ({}).", recorded.show(), detected.show() ); detected } } else { detected }; let data_dir = cfg::env_data_dir(env_scope, &env_name); let image = ec.active_image().to_string(); let result = freeze::freeze_from_dir(env_scope, ver.clone(), engine, &image, &data_dir.to_string_lossy(), output_dir, verbose); if result.is_ok() && ec.morloc_version.as_ref() != Some(&ver) { let mut updated = ec.clone(); updated.morloc_version = Some(ver); let _ = cfg::write_env_config(env_scope, &env_name, &updated); } result } // ---- unfreeze ---- Cmd::Unfreeze { from, tag, base, engine: engine_override, rebuild } => { let from = { let p = std::path::Path::new(&from); if p.is_dir() { let tar = p.join("state.tar.gz"); if tar.is_file() { tar.to_string_lossy().to_string() } else { return Err(ManagerError::UnfreezeError(format!( "Directory '{}' does not contain state.tar.gz. \ Pass the path to state.tar.gz directly, or the directory containing it.", from ))); } } else if p.is_file() { from } else { return Err(ManagerError::UnfreezeError(format!( "Input not found: {from}. \ Pass the path to state.tar.gz or the directory containing it." ))); } }; // Read version and engine from the freeze manifest so unfreeze // works on deployment machines with no morloc environments. let tarball_dir = std::path::Path::new(&from) .parent() .unwrap_or(std::path::Path::new(".")); let manifest_path = tarball_dir.join("freeze-manifest.json"); let manifest = freeze::read_freeze_manifest(&manifest_path.to_string_lossy()) .map_err(|_| ManagerError::UnfreezeError(format!( "Cannot read freeze manifest at {}. 
Ensure state.tar.gz and freeze-manifest.json are in the same directory.", manifest_path.display() )))?; let engine = match engine_override { Some(EngineArg::Docker) => ContainerEngine::Docker, Some(EngineArg::Podman) => ContainerEngine::Podman, None => { let e = ensure_engine()?; eprintln!( "Note: using {} engine from global config. Override with --engine if needed.", display_engine(e) ); e } }; serve::build_serve_image(engine, verbose, &from, &tag, manifest.morloc_version, base.as_deref(), rebuild, &manifest.programs) } // ---- start ---- Cmd::Start { name, port, env_vars, env_file, force } => { let (env_name, env_scope, ec) = resolve_env_or_active(name)?; let image = ec.active_image().to_string(); let data_dir = cfg::env_data_dir(env_scope, &env_name); let container_name = serve::serve_container_name(&env_name); // Warn if a Dockerfile is configured but the layered image hasn't been built if ec.dockerfile.is_some() && ec.built_image.is_none() { eprintln!("Warning: Dockerfile is configured but image has not been built. Using base image."); eprintln!(" Run 'morloc-manager update {env_name}' to build the Dockerfile layer."); } // Refuse to replace a running container unless --force is passed if container::container_exists(ec.engine, &container_name) { if !force { return Err(ManagerError::EnvError(format!( "Serve container already running for '{env_name}'. Use --force to replace." 
))); } eprintln!("Warning: replacing existing serve container '{container_name}'"); } let port_mappings = if port.is_empty() { vec![(8080, 8080)] } else { port }; let flags_path = cfg::env_flags_path(env_scope, &env_name); let extra_flags = cfg::read_flags_file(&flags_path); let user_env = collect_env_vars(&env_vars, env_file.as_deref())?; serve::serve_environment( ec.engine, verbose, &image, &data_dir.to_string_lossy(), &container_name, &port_mappings, &extra_flags, &Some(ec.shm_size.clone()), &user_env, ) } // ---- stop ---- Cmd::Stop { name } => { let (env_name, _, ec) = resolve_env_or_active(name)?; let container_name = serve::serve_container_name(&env_name); if crate::container::container_exists(ec.engine, &container_name) { serve::stop_serve_container(ec.engine, verbose, &container_name)?; eprintln!("Stopped serving environment: {env_name}"); } else { return Err(ManagerError::EnvError( format!("No serve container running for environment '{env_name}'") )); } Ok(()) } // ---- logs ---- Cmd::Logs { name, follow } => { let (container_name, engine) = if let Some(ref n) = name { let (_, _, ec) = resolve_env_or_active(Some(n.clone()))?; let cname = serve::serve_container_name(n); if !container::container_exists(ec.engine, &cname) { return Err(ManagerError::EnvError( format!("No serve container running for environment '{n}'") )); } (cname, ec.engine) } else { find_running_serve_container()? }; let exe = match engine { ContainerEngine::Podman => "podman", ContainerEngine::Docker => "docker", }; let mut cmd_args = vec!["logs"]; if follow { cmd_args.push("-f"); } cmd_args.push(&container_name); // Log content is the primary data of this command, so both the // container's original stdout and stderr should go to our stdout. // docker/podman logs preserves the original stream split; we merge // them so that `morloc-manager logs | grep ERROR` works. 
let stdout_handle = std::io::stdout(); let status = std::process::Command::new(exe) .args(&cmd_args) .stdin(Stdio::null()) .stdout(Stdio::inherit()) .stderr(Stdio::from(stdout_handle)) .status() .map_err(|e| ManagerError::EnvError(format!("Failed to run {exe} logs: {e}")))?; if !status.success() { return Err(ManagerError::EngineError { engine, code: status.code().unwrap_or(1), stderr: String::new(), }); } Ok(()) } // ---- eval ---- Cmd::Eval { first, second, port } => { let expr = if let Some(ref expr_arg) = second { // first is env name — validate it exists and its serve container is running let (env_name, _, ec) = resolve_env_or_active(Some(first))?; let container_name = serve::serve_container_name(&env_name); if !container::container_exists(ec.engine, &container_name) { return Err(ManagerError::EnvError(format!( "No serve container running for '{env_name}'. Start with: morloc-manager start {env_name}" ))); } expr_arg.clone() } else { first }; use std::io::{Read as IoRead, Write as IoWrite}; let body = format!("{{\"expr\":{}}}", serde_json::to_string(&expr).unwrap_or_default()); let request = format!( "POST /eval HTTP/1.1\r\nHost: localhost\r\nContent-Type: application/json\r\nContent-Length: {}\r\nConnection: close\r\n\r\n{}", body.len(), body ); let addr = format!("127.0.0.1:{port}"); let mut stream = std::net::TcpStream::connect(&addr).map_err(|e| { ManagerError::EnvError(format!( "Cannot connect to serve container on {addr}: {e}\n Is a serve container running? 
Start with: morloc-manager start" )) })?; stream.write_all(request.as_bytes()).map_err(|e| { ManagerError::EnvError(format!("Failed to send request: {e}")) })?; let mut response = String::new(); stream.read_to_string(&mut response).map_err(|e| { ManagerError::EnvError(format!("Failed to read response: {e}")) })?; // Extract body from HTTP response (after \r\n\r\n) if let Some(pos) = response.find("\r\n\r\n") { let body = &response[pos + 4..]; println!("{body}"); } else { println!("{response}"); } Ok(()) } // ---- status ---- Cmd::Status => { let mut all_containers: Vec = Vec::new(); let mut any_engine = false; for engine in [ContainerEngine::Podman, ContainerEngine::Docker] { let exe = match engine { ContainerEngine::Podman => "podman", ContainerEngine::Docker => "docker", }; if which(exe) { any_engine = true; if let Ok(containers) = serve::query_serve_containers(engine, verbose) { all_containers.extend(containers); } } } if !any_engine { return Err(ManagerError::EngineNotFound); } if json { #[derive(serde::Serialize)] struct StatusOutput { containers: Vec } let output = StatusOutput { containers: all_containers }; println!("{}", serde_json::to_string_pretty(&output).unwrap()); } else if all_containers.is_empty() { println!("No morloc serve containers running."); } else { println!("Running servers:"); for c in &all_containers { println!(" {} {} ({}) [{}]", c.name, c.ports, c.env, c.status); } } Ok(()) } // ---- doctor ---- Cmd::Doctor { name, system, deep, strict } => { let (env_name, env_scope, ec) = if let Some(ref n) = name { let s = if system { Scope::System } else { cfg::find_env_scope(n)? }; let c = cfg::read_env_config(s, n)?; (n.clone(), s, c) } else { resolve_env_or_active(None)? 
}; doctor::doctor(ec.engine, verbose, &env_name, env_scope, &ec, deep, strict, json) } } } // ====================================================================== // Serve container discovery // ====================================================================== /// Find exactly one running morloc-serve-* container across all engines. /// Returns (container_name, engine). Errors if zero or multiple found. fn find_running_serve_container() -> Result<(String, ContainerEngine)> { let mut found: Vec<(String, ContainerEngine)> = Vec::new(); for engine in [ContainerEngine::Podman, ContainerEngine::Docker] { let exe = match engine { ContainerEngine::Podman => "podman", ContainerEngine::Docker => "docker", }; if which(exe) { for name in serve::find_running_serve_containers(engine) { found.push((name, engine)); } } } match found.len() { 0 => Err(ManagerError::EnvError( "No morloc serve containers running".to_string(), )), 1 => Ok(found.into_iter().next().unwrap()), _ => { let names: Vec = found.iter().map(|(n, _)| n.clone()).collect(); Err(ManagerError::EnvError(format!( "Multiple serve containers running. 
Specify one explicitly:\n {}",
                names.join("\n ")
            )))
        }
    }
}

// ======================================================================
// Container run
// ======================================================================

/// Run a command in the currently active environment's container.
///
/// Convenience wrapper around `run_in_container_for` with no explicit
/// target environment.
fn run_in_container(
    verbose: bool,
    shell: bool,
    args: &[String],
    user_env: &[(String, String)],
) -> Result<()> {
    run_in_container_for(None, verbose, shell, args, user_env)
}

/// Run a command (or an interactive shell) inside the container of `target`,
/// or of the active environment when `target` is `None`.
///
/// Pre-flight checks performed before delegating to `run_with_config`:
/// - warn when a Dockerfile is configured but its image layer was never built;
/// - verify the engine socket is reachable and the image exists locally;
/// - refuse to bind-mount the root directory;
/// - apply SELinux-aware handling of the working-directory mount.
fn run_in_container_for(
    target: Option<(String, Scope, EnvironmentConfig)>,
    verbose: bool,
    shell: bool,
    args: &[String],
    user_env: &[(String, String)],
) -> Result<()> {
    let (env_name, env_scope, ec) = match target {
        Some(t) => t,
        None => environment::resolve_active_environment()?,
    };
    let engine = ec.engine;
    let image = ec.active_image().to_string();
    let data_dir = cfg::env_data_dir(env_scope, &env_name);
    let v_data_dir = data_dir.to_string_lossy().to_string();

    // Warn if a Dockerfile is configured but the layered image hasn't been built
    if ec.dockerfile.is_some() && ec.built_image.is_none() {
        eprintln!("Warning: Dockerfile is configured but image has not been built. Using base image.");
        eprintln!(" Run 'morloc-manager update {env_name}' to build the Dockerfile layer.");
    }

    // Fail fast with a clear message if docker socket is unreachable
    require_docker_socket(engine)?;

    // Verify the image is accessible before attempting to run
    if !container::image_exists_locally(engine, &image) {
        // Show the raw container engine error before our hint
        if let Some(raw_err) = container::image_inspect_stderr(engine, &image) {
            let trimmed = raw_err.trim();
            if !trimmed.is_empty() {
                eprintln!("{trimmed}");
            }
        }
        if env_scope == Scope::System && !check_podman_additional_stores(engine) {
            return Err(ManagerError::EnvError(format!(
                "Image '{image}' not found. \n\
                 The environment '{env_name}' is a system environment \
                 but Podman is not configured to see rootful images.\n\
                 Option 1 (recommended): Use Docker for system environments.\n\
                 Option 2: Add to [storage.options] in /etc/containers/storage.conf:\n\n \
                 additionalimagestores = [\"/var/lib/containers/storage\"]\n\n\
                 Note: Option 2 may cause storage locking conflicts on Fedora and Debian.\n"
            )));
        }
        let hint = if env_scope == Scope::System {
            format!("Ask your administrator to run: sudo morloc-manager update {env_name}")
        } else {
            format!("Run 'morloc-manager update {env_name}' to build it.")
        };
        return Err(ManagerError::EnvError(format!(
            "Image '{image}' not found locally. {hint}"
        )));
    }

    let se_mode = detect_selinux();
    let suffix = volume_suffix(se_mode);
    let home = dirs::home_dir()
        .unwrap_or_default()
        .to_string_lossy()
        .to_string();
    let cwd = std::env::current_dir()
        .unwrap_or_default()
        .to_string_lossy()
        .to_string();

    // Refuse to run from the root directory — container engines cannot
    // bind-mount "/" and the resulting error is opaque.
    if !shell && cwd == "/" {
        return Err(ManagerError::EnvError(
            "Cannot run from the root directory (/). \
             Change to a subdirectory first (e.g., cd /tmp).".to_string()
        ));
    }

    // Read flags from the environment's flags file
    let flags_path = cfg::env_flags_path(env_scope, &env_name);
    let extra_flags = cfg::read_flags_file(&flags_path);

    // `morloc init` needs no working-directory mount at all.
    let is_init = matches!(args, [a, b, ..] if a == "morloc" && b == "init");
    let is_home_dir = normalize_trailing(&cwd) == normalize_trailing(&home);

    if !is_init && !suffix.is_empty() && !is_home_dir {
        // SELinux enforcing, normal project directory: validate before relabel.
        selinux::validate_mount_path(&cwd)?;
        run_with_config(
            engine, verbose, &image, &v_data_dir, &home, &cwd, suffix, shell,
            args, false, &ec.shm_size, &extra_flags, user_env,
        )
    } else {
        // Running from $HOME under SELinux would relabel the whole home
        // directory — skip the working-directory mount instead.
        let (cwd_final, skip_work_mount) = if is_home_dir && !suffix.is_empty() && !is_init {
            eprintln!("Warning: running from home directory with SELinux; working directory mount skipped.");
            eprintln!("Workaround: create a project subdirectory and work from there:");
            eprintln!(" mkdir ~/myproject && cd ~/myproject");
            (home.clone(), true)
        } else {
            (cwd, false)
        };
        run_with_config(
            engine, verbose, &image, &v_data_dir, &home, &cwd_final, suffix, shell,
            args, is_init || skip_work_mount, &ec.shm_size, &extra_flags, user_env,
        )
    }
}

/// Assemble a `RunConfig` (mounts, environment, workdir, shm size) and
/// execute it, translating the container exit status into this tool's
/// error conventions.
fn run_with_config(
    engine: ContainerEngine,
    verbose: bool,
    image: &str,
    v_data_dir: &str,
    home: &str,
    cwd: &str,
    suffix: &str,
    shell: bool,
    args: &[String],
    is_init: bool,
    shm_size: &str,
    extra_flags: &[String],
    user_env: &[(String, String)],
) -> Result<()> {
    if shell {
        if !io::stdin().is_terminal() || !io::stdout().is_terminal() {
            eprintln!("Error: --shell requires an interactive terminal (TTY).");
            eprintln!("If connecting over SSH, use: ssh -t morloc-manager run --shell");
            std::process::exit(1);
        }
    }

    // Mount data at /opt/morloc — matching the serve container (start).
    // The compiler reads MORLOC_HOME to resolve all generated paths.
    let mh = "/opt/morloc";
    let base_mounts = vec![
        (v_data_dir.to_string(), mh.to_string()),
    ];
    let work_mount = if is_init {
        Vec::new()
    } else {
        vec![(cwd.to_string(), cwd.to_string())]
    };
    let all_mounts: Vec<(String, String)> =
        base_mounts.into_iter().chain(work_mount).collect();
    let work_dir = if is_init { mh.to_string() } else { cwd.to_string() };
    let mut env_vars = vec![
        ("HOME".to_string(), home.to_string()),
        ("MORLOC_HOME".to_string(), mh.to_string()),
        (
            "PATH".to_string(),
            format!("{mh}/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin"),
        ),
    ];
    env_vars.extend(user_env.iter().cloned());
    let cmd = if shell {
        Some(vec!["/bin/bash".to_string()])
    } else if args.is_empty() {
        None
    } else {
        Some(args.to_vec())
    };
    let cfg = RunConfig {
        image: image.to_string(),
        bind_mounts: all_mounts,
        env: env_vars,
        interactive: shell,
        shm_size: Some(shm_size.to_string()),
        work_dir: Some(work_dir),
        selinux_suffix: suffix.to_string(),
        command: cmd,
        extra_flags: extra_flags.to_vec(),
        ..RunConfig::new(image)
    };
    let status = container_run_passthrough(engine, verbose, shell, &cfg);
    let code = status.code().unwrap_or(1);
    if status.success() {
        Ok(())
    } else if code >= 125 {
        // Exit 125+ = container engine error (not the user's program)
        Err(ManagerError::EngineError {
            engine,
            code,
            stderr: "Container engine error".to_string(),
        })
    } else {
        // Exit 1-124 = program exited with non-zero, pass through silently
        std::process::exit(code);
    }
}

/// Run `morloc init -f` inside the target environment's container
/// (quiet mode unless `verbose`).
fn run_morloc_init_for(
    target: Option<(String, Scope, EnvironmentConfig)>,
    verbose: bool,
) -> Result<()> {
    let init_args: Vec<String> = if verbose {
        ["morloc", "init", "-f"].iter().map(|s| s.to_string()).collect()
    } else {
        ["morloc", "init", "-f", "-q"].iter().map(|s| s.to_string()).collect()
    };
    eprintln!("Initializing morloc (this may take several minutes)...");
    run_in_container_for(target, verbose, false, &init_args, &[])
}

/// Append a trailing slash when absent so path comparisons ignore it.
fn normalize_trailing(p: &str) -> String {
    let mut s = p.to_string();
    if !s.ends_with('/') {
        s.push('/');
    }
    s
}

// 
====================================================================== // Tests // ====================================================================== #[cfg(test)] mod tests { use super::*; use crate::container::{build_build_args, build_run_args, engine_executable, engine_specific_run_flags, BuildConfig}; // ---- Type tests ---- #[test] fn show_version_formats_correctly() { assert_eq!(Version::new(0, 67, 0).show(), "0.67.0"); } #[test] fn parse_version_round_trips() { assert_eq!("0.67.0".parse::().ok(), Some(Version::new(0, 67, 0))); } #[test] fn parse_version_rejects_invalid() { assert!("abc".parse::().is_err()); } #[test] fn parse_version_rejects_incomplete() { assert!("0.67".parse::().is_err()); } #[test] fn version_ordering_is_semantic() { assert!(Version::new(1, 0, 0) > Version::new(0, 99, 99)); } #[test] fn version_ordering_minor() { assert!(Version::new(0, 2, 0) > Version::new(0, 1, 99)); } #[test] fn version_equality() { assert_eq!(Version::new(0, 67, 0), Version::new(0, 67, 0)); } #[test] fn parse_version_with_prerelease() { for (input, expected_pre) in [ ("0.77.0-rc.1", "rc.1"), ("1.0.0-alpha", "alpha"), ("1.0.0-beta.2", "beta.2"), ("0.1.0-dev.20260414", "dev.20260414"), ] { let ver: Version = input.parse().unwrap(); assert_eq!(ver.prerelease, Some(expected_pre.to_string()), "input: {input}"); assert_eq!(ver.show(), input, "round-trip failed for: {input}"); } } #[test] fn prerelease_sorts_before_release() { let rc: Version = "0.77.0-rc.1".parse().unwrap(); let release = Version::new(0, 77, 0); assert!(rc < release); } // ---- Error message tests ---- #[test] fn invalid_version_renders() { let err = ManagerError::InvalidVersion("abc".to_string()); assert!(err.to_string().contains("Invalid version")); } #[test] fn no_command_renders() { let err = ManagerError::NoCommand; assert!(err.to_string().contains("No command")); } #[test] fn no_active_environment_suggests_new() { let err = ManagerError::NoActiveEnvironment; 
assert!(err.to_string().contains("new")); } #[test] fn config_permission_denied_mentions_permissions() { let err = ManagerError::ConfigPermissionDenied("/etc/morloc/config.json".to_string()); assert!(err.to_string().contains("Permission")); } #[test] fn freeze_error_renders() { let err = ManagerError::FreezeError("tar error".to_string()); assert!(err.to_string().contains("Freeze failed")); } // ---- Config default tests ---- #[test] fn default_config_has_no_active_env() { assert_eq!(Config::default().active_env, None); } #[test] fn default_config_uses_podman() { assert_eq!(Config::default().engine, ContainerEngine::Podman); } // ---- Config JSON round-trip tests ---- #[test] fn config_json_round_trip() { let dir = tempfile::tempdir().unwrap(); let path = dir.path().join("config.json"); let cfg = Config { active_env: Some("ml".to_string()), engine: ContainerEngine::Docker, }; cfg::write_config(&path, &cfg).unwrap(); let cfg2: Config = cfg::read_config(&path).unwrap(); assert_eq!(cfg2.active_env.as_deref(), Some("ml")); assert_eq!(cfg2.engine, ContainerEngine::Docker); } #[test] fn config_read_missing_returns_not_found() { let dir = tempfile::tempdir().unwrap(); let path = dir.path().join("nonexistent.json"); let result = cfg::read_config::(&path); assert!(matches!(result, Err(ManagerError::ConfigNotFound(_)))); } #[test] fn config_read_invalid_json_returns_parse_error() { let dir = tempfile::tempdir().unwrap(); let path = dir.path().join("bad.json"); fs::write(&path, "not json at all").unwrap(); let result = cfg::read_config::(&path); assert!(matches!(result, Err(ManagerError::ConfigParseError { .. 
}))); } #[test] fn env_config_json_round_trip() { let dir = tempfile::tempdir().unwrap(); let path = dir.path().join("env.json"); let ec = EnvironmentConfig { name: "test".to_string(), base_image: "ghcr.io/morloc-project/morloc/morloc-full:0.67.0".to_string(), original_image: None, dockerfile: None, content_hash: None, built_image: None, engine: ContainerEngine::Podman, shm_size: "1g".to_string(), morloc_version: Some(Version::new(0, 67, 0)), }; cfg::write_config(&path, &ec).unwrap(); let ec2: EnvironmentConfig = cfg::read_config(&path).unwrap(); assert_eq!(ec2.name, "test"); assert_eq!(ec2.shm_size, "1g"); assert_eq!(ec2.morloc_version, Some(Version::new(0, 67, 0))); } #[test] fn freeze_manifest_json_round_trip() { let dir = tempfile::tempdir().unwrap(); let path = dir.path().join("fm.json"); let fm = FreezeManifest { morloc_version: Version::new(0, 67, 0), frozen_at: chrono::Utc::now(), modules: vec![ModuleEntry { name: "math".to_string(), version: Some("0.3.0".to_string()), sha256: "abc123".to_string(), }], programs: vec![ProgramEntry { name: "svc".to_string(), commands: vec!["hello".to_string(), "compute".to_string()], }], base_image: "morloc-full:0.67.0".to_string(), env_layer: Some(FrozenEnvLayer { name: "ml".to_string(), dockerfile: "FROM scratch".to_string(), content_hash: "abc".to_string(), image_tag: None, }), env_vars: Vec::new(), }; cfg::write_config(&path, &fm).unwrap(); let fm2: FreezeManifest = cfg::read_config(&path).unwrap(); assert_eq!(fm2.morloc_version, Version::new(0, 67, 0)); assert_eq!(fm2.modules.len(), 1); assert_eq!(fm2.programs.len(), 1); assert_eq!(fm2.programs[0].commands, vec!["hello", "compute"]); // env_vars is no longer written but can still be read from old manifests assert!(fm2.env_vars.is_empty()); } #[test] fn freeze_manifest_reads_legacy_env_vars() { let dir = tempfile::tempdir().unwrap(); let path = dir.path().join("legacy.json"); // Simulate an old manifest that included env_vars let json = r#"{ "morloc_version": 
{"major":0,"minor":67,"patch":0,"pre":null}, "frozen_at": "2025-01-01T00:00:00Z", "modules": [], "programs": [], "base_image": "morloc-full:0.67.0", "env_layer": null, "env_vars": ["API_KEY", "DB_URL"] }"#; std::fs::write(&path, json).unwrap(); let fm: FreezeManifest = cfg::read_config(&path).unwrap(); assert_eq!(fm.env_vars, vec!["API_KEY", "DB_URL"]); } // ---- Config flags tests ---- #[test] fn read_flags_file_parses() { let dir = tempfile::tempdir().unwrap(); let path = dir.path().join("test.flags"); fs::write( &path, "# This is a comment\n--gpus all\n\n -v /data:/data \n# another comment\n--network host\n", ) .unwrap(); let flags = cfg::read_flags_file(&path); assert_eq!( flags, vec!["--gpus", "all", "-v", "/data:/data", "--network", "host"] ); } #[test] fn read_flags_file_missing() { let dir = tempfile::tempdir().unwrap(); let flags = cfg::read_flags_file(&dir.path().join("nope.flags")); assert!(flags.is_empty()); } #[test] fn read_flags_file_expands_env_vars() { let dir = tempfile::tempdir().unwrap(); let path = dir.path().join("test.flags"); fs::write(&path, "-v $HOME/data:/data\n").unwrap(); let flags = cfg::read_flags_file(&path); let home = std::env::var("HOME").unwrap(); assert_eq!(flags, vec!["-v", &format!("{home}/data:/data")]); } #[test] fn read_flags_file_expands_tilde() { let dir = tempfile::tempdir().unwrap(); let path = dir.path().join("test.flags"); fs::write(&path, "-v ~/data:/data\n").unwrap(); let flags = cfg::read_flags_file(&path); let home = std::env::var("HOME").unwrap(); assert_eq!(flags, vec!["-v", &format!("{home}/data:/data")]); } // ---- Container CLI argument tests ---- #[test] fn engine_executable_docker() { assert_eq!(engine_executable(ContainerEngine::Docker), "docker"); } #[test] fn engine_executable_podman() { assert_eq!(engine_executable(ContainerEngine::Podman), "podman"); } #[test] fn build_run_args_minimal() { let cfg = RunConfig::new("myimage:latest"); let args = build_run_args( ContainerEngine::Docker, 
&engine_specific_run_flags(ContainerEngine::Docker), &cfg, ); assert_eq!(args[0], "run"); assert!(args.contains(&"--rm".to_string())); assert!(args.contains(&"myimage:latest".to_string())); assert!(!args.contains(&"-it".to_string())); } #[test] fn build_run_args_podman_userns() { let cfg = RunConfig::new("myimage:latest"); let args = build_run_args( ContainerEngine::Podman, &engine_specific_run_flags(ContainerEngine::Podman), &cfg, ); assert!(args.contains(&"--userns=keep-id".to_string())); } #[test] fn build_run_args_interactive() { let mut cfg = RunConfig::new("img"); cfg.interactive = true; let args = build_run_args( ContainerEngine::Docker, &engine_specific_run_flags(ContainerEngine::Docker), &cfg, ); assert!(args.contains(&"-it".to_string())); } #[test] fn build_run_args_selinux_suffix() { let mut cfg = RunConfig::new("img"); cfg.bind_mounts = vec![("/host".to_string(), "/container".to_string())]; cfg.selinux_suffix = ":z".to_string(); let args = build_run_args( ContainerEngine::Docker, &engine_specific_run_flags(ContainerEngine::Docker), &cfg, ); assert!(args.contains(&"-v".to_string())); assert!(args.contains(&"/host:/container:z".to_string())); } #[test] fn build_run_args_workdir() { let mut cfg = RunConfig::new("img"); cfg.work_dir = Some("/work".to_string()); let args = build_run_args( ContainerEngine::Docker, &engine_specific_run_flags(ContainerEngine::Docker), &cfg, ); assert!(args.contains(&"-w".to_string())); assert!(args.contains(&"/work".to_string())); } #[test] fn build_run_args_read_only() { let mut cfg = RunConfig::new("img"); cfg.read_only = true; let args = build_run_args( ContainerEngine::Docker, &engine_specific_run_flags(ContainerEngine::Docker), &cfg, ); assert!(args.contains(&"--read-only".to_string())); } #[test] fn build_run_args_command_at_end() { let mut cfg = RunConfig::new("img"); cfg.command = Some(vec![ "morloc".to_string(), "make".to_string(), "-o".to_string(), "svc".to_string(), "svc.loc".to_string(), ]); let args = 
build_run_args( ContainerEngine::Docker, &engine_specific_run_flags(ContainerEngine::Docker), &cfg, ); let img_idx = args.iter().position(|a| a == "img").unwrap(); let cmd_idx = args.iter().position(|a| a == "morloc").unwrap(); assert!(img_idx < cmd_idx); } #[test] fn build_build_args_includes_tag_and_dockerfile() { let cfg = BuildConfig { dockerfile: "/tmp/Dockerfile".to_string(), context: "/tmp/ctx".to_string(), tag: "test:v1".to_string(), build_args: vec![("BASE".to_string(), "ubuntu:22.04".to_string())], }; let args = build_build_args(&cfg); assert_eq!(args[0], "build"); assert!(args.contains(&"-f".to_string())); assert!(args.contains(&"-t".to_string())); assert!(args.contains(&"--build-arg".to_string())); assert_eq!(args.last().unwrap(), "/tmp/ctx"); } // ---- SELinux tests ---- #[test] fn root_is_unsafe() { assert!(!selinux::is_safe_to_relabel("/")); } #[test] fn tmp_is_unsafe() { assert!(!selinux::is_safe_to_relabel("/tmp")); } #[test] fn tmp_subdir_is_unsafe() { assert!(!selinux::is_safe_to_relabel("/tmp/foo")); } #[test] fn home_subdir_is_safe() { assert!(selinux::is_safe_to_relabel("/home/user/project")); } #[test] fn var_tmp_is_unsafe() { assert!(!selinux::is_safe_to_relabel("/var/tmp")); } } ================================================ FILE: data/rust/morloc-manager/src/selinux.rs ================================================ use std::path::Path; use std::process::Command; use crate::error::{ManagerError, Result}; #[derive(Debug, Clone, Copy, PartialEq, Eq)] pub enum SELinuxMode { Enforcing, Permissive, Disabled, } pub fn detect_selinux() -> SELinuxMode { if !Path::new("/usr/sbin/getenforce").exists() { return SELinuxMode::Disabled; } let Ok(output) = Command::new("getenforce").output() else { return SELinuxMode::Disabled; }; if !output.status.success() { return SELinuxMode::Disabled; } let stdout = String::from_utf8_lossy(&output.stdout); let first_line = stdout.lines().next().unwrap_or(""); match first_line { "Enforcing" => 
SELinuxMode::Enforcing,
        "Permissive" => SELinuxMode::Permissive,
        _ => SELinuxMode::Disabled,
    }
}

/// Volume-mount suffix requesting SELinux relabeling (`:z`) when enforcing,
/// empty otherwise.
pub fn volume_suffix(mode: SELinuxMode) -> &'static str {
    match mode {
        SELinuxMode::Enforcing => ":z",
        SELinuxMode::Permissive | SELinuxMode::Disabled => "",
    }
}

/// True when `path` may be relabeled for a bind mount: it must not be a
/// sensitive system path and must not be the home directory root itself.
pub fn is_safe_to_relabel(path: &str) -> bool {
    let home = dirs::home_dir().unwrap_or_default();
    let norm = normalize(path);
    let home_norm = normalize_trailing(&home.to_string_lossy());
    let is_home_root = normalize_trailing(&norm) == home_norm;
    !is_unsafe_system_path(&norm) && !is_home_root
}

/// Validate that `path` is safe to bind-mount with SELinux relabeling,
/// returning a descriptive `SELinuxError` otherwise.
pub fn validate_mount_path(path: &str) -> Result<()> {
    if is_safe_to_relabel(path) {
        Ok(())
    } else {
        Err(ManagerError::SELinuxError(format!(
            "Cannot bind-mount {path} with SELinux relabeling. \
             This path is unsafe to relabel. \
             Use a subdirectory instead (e.g., {path}/project/)."
        )))
    }
}

/// System locations where relabeling would be dangerous: `/`, `/tmp`,
/// `/var/tmp`, and anything beneath the latter two.
fn is_unsafe_system_path(p: &str) -> bool {
    let norm = normalize_trailing(p);
    norm == "/"
        || norm.starts_with("/tmp/")
        || norm == "/tmp/"
        || norm.starts_with("/var/tmp/")
        || norm == "/var/tmp/"
}

fn normalize(p: &str) -> String {
    // NOTE(review): currently a plain round-trip through `Path` — no `.`
    // resolution or trailing-slash removal actually happens here.
    let path = Path::new(p);
    path.to_string_lossy().to_string()
}

fn normalize_trailing(p: &str) -> String {
    let mut s = normalize(p);
    if !s.ends_with('/') {
        s.push('/');
    }
    s
}


================================================
FILE: data/rust/morloc-manager/src/serve.rs
================================================

use std::fs;
use std::path::Path;
use std::process::{Command, Stdio};
use std::thread;
use std::time::Duration;

use crate::container::{
    container_build, container_pull, container_run, container_run_quiet, container_stop,
    container_remove, engine_executable, exit_code_to_int, image_exists_locally, BuildConfig,
    RunConfig,
};
use crate::error::{ManagerError, Result};
use crate::types::*;

/// Build a self-contained serve image from a frozen state tarball.
///
/// Steps: resolve the base image (pulling it if absent), extract the
/// tarball into a temporary build context, rewrite manifest paths for the
/// container filesystem, generate a Dockerfile, build the image, validate
/// the installed programs, and clean up the build context.
pub fn build_serve_image(
    engine: ContainerEngine,
    verbose: bool,
    state_tarball: &str,
    tag: &str,
    ver: Version,
    base_override: Option<&str>,
    rebuild: bool,
    programs: &[ProgramEntry],
) -> Result<()> {
    if !Path::new(state_tarball).exists() {
        return Err(ManagerError::UnfreezeError(format!(
            "Tarball not found: {state_tarball}"
        )));
    }
    if !rebuild && image_exists_locally(engine, tag) {
        eprintln!("Image '{tag}' already exists locally; skipping build (use --rebuild to force)");
        return Ok(());
    }

    let tarball_dir = Path::new(state_tarball)
        .parent()
        .unwrap_or(Path::new("."));
    let manifest_path = tarball_dir.join("freeze-manifest.json");
    let m_manifest = if manifest_path.exists() {
        crate::freeze::read_freeze_manifest(&manifest_path.to_string_lossy()).ok()
    } else {
        None
    };
    let base_image = match base_override {
        Some(b) => b.to_string(),
        None => resolve_base_from_manifest(engine, m_manifest.as_ref(), ver),
    };
    eprintln!("Using base image: {base_image}");

    // Pull the base image if it is not already present locally.
    if !image_exists_locally(engine, &base_image) {
        let exe = engine_executable(engine);
        if verbose {
            eprintln!("[morloc-manager] {exe} pull {base_image}");
        }
        let (pull_status, _, pull_err) = container_pull(engine, &base_image);
        if !pull_status.success() {
            return Err(ManagerError::EngineError {
                engine,
                code: exit_code_to_int(pull_status),
                stderr: pull_err,
            });
        }
    }

    let context_dir = tarball_dir.join("serve-build");
    fs::create_dir_all(&context_dir)
        .map_err(|e| ManagerError::UnfreezeError(format!("mkdir failed: {e}")))?;

    eprintln!("Extracting frozen state...");
    let tar_status = Command::new("tar")
        .args(["-xzf", state_tarball, "-C", &context_dir.to_string_lossy()])
        .stdin(Stdio::null())
        .stdout(Stdio::null())
        .stderr(Stdio::inherit())
        .status()
        .map_err(|e| ManagerError::UnfreezeError(format!("tar extract failed: {e}")))?;
    if !tar_status.success() {
        return Err(ManagerError::UnfreezeError(
            "tar extract failed (see error output above)".to_string(),
        ));
    }

    // Rewrite build.path in each manifest so the nexus chdirs to the
    // container-internal path instead of the original host path.
    rewrite_manifest_paths(&context_dir)?;

    let dockerfile_path = context_dir.join("Dockerfile");

    // Only emit COPY lines for directories that exist and are non-empty.
    let has_exe = context_dir.join("exe").is_dir()
        && fs::read_dir(context_dir.join("exe"))
            .map(|mut d| d.next().is_some())
            .unwrap_or(false);
    let has_opt = context_dir.join("opt").is_dir()
        && fs::read_dir(context_dir.join("opt"))
            .map(|mut d| d.next().is_some())
            .unwrap_or(false);
    let has_src = context_dir.join("src").is_dir()
        && fs::read_dir(context_dir.join("src"))
            .map(|mut d| d.next().is_some())
            .unwrap_or(false);

    let mh = CONTAINER_MORLOC_HOME;
    let exe_line = if has_exe { format!("COPY exe/ {mh}/exe/\n") } else { String::new() };
    let opt_line = if has_opt { format!("COPY opt/ {mh}/opt/\n") } else { String::new() };
    let src_line = if has_src { format!("COPY src/ {mh}/src/\n") } else { String::new() };

    // Podman's OCI format drops HEALTHCHECK; omit it to avoid warnings.
    let healthcheck = if engine == ContainerEngine::Docker {
        "# Health check for container orchestrators\n\
         HEALTHCHECK --interval=30s --timeout=5s --retries=3 \\\n\
         CMD curl -sf http://localhost:8080/health || exit 1\n\
         \n"
            .to_string()
    } else {
        String::new()
    };

    let dockerfile_content = format!(
        "# Auto-generated by morloc-manager serve-image\n\
         FROM {base_image}\n\
         \n\
         # Ensure morloc binaries are on PATH\n\
         ENV PATH=\"{mh}/bin:${{PATH}}\"\n\
         \n\
         # Morloc home for pool path resolution\n\
         ENV MORLOC_HOME=\"{mh}\"\n\
         \n\
         # Copy frozen morloc state (modules, manifests, binaries, pools)\n\
         COPY lib/ {mh}/lib/\n\
         COPY fdb/ {mh}/fdb/\n\
         COPY bin/ {mh}/bin/\n\
         {exe_line}\
         {opt_line}\
         {src_line}\
         RUN chmod -R a+rX {mh}\n\
         \n\
         {healthcheck}\
         # Entrypoint: nexus router aggregates all installed programs\n\
         ENTRYPOINT [\"morloc-nexus\", \"--router\", \\\n\
         \"--fdb\", \"{mh}/fdb\", \\\n\
         \"--http-port\", \"8080\"]\n"
    );
    fs::write(&dockerfile_path, &dockerfile_content)
        .map_err(|e| ManagerError::UnfreezeError(format!("Write Dockerfile failed: {e}")))?;

    eprintln!("Building serve image {tag} (base: {base_image})...");
    let build_cfg = BuildConfig {
        dockerfile: dockerfile_path.to_string_lossy().to_string(),
        context: context_dir.to_string_lossy().to_string(),
        tag: tag.to_string(),
        build_args: Vec::new(),
    };
    if verbose {
        let exe = engine_executable(engine);
        eprintln!(
            "[morloc-manager] {exe} build -f {} -t {tag} {}",
            build_cfg.dockerfile, build_cfg.context
        );
    }
    let (status, _, build_err) = container_build(engine, &build_cfg);
    if !status.success() {
        return Err(ManagerError::EngineError {
            engine,
            code: exit_code_to_int(status),
            stderr: build_err,
        });
    }
    eprintln!("Built serve image: {tag}");

    // Validate programs work inside the built image
    validate_programs(engine, tag, programs, Vec::new(), verbose)?;

    // Clean up the temporary build context
    if let Err(e) = fs::remove_dir_all(&context_dir) {
        eprintln!("Warning: failed to clean up {}: {e}", context_dir.display());
    }
    Ok(())
}
#[allow(dead_code)] pub fn run_serve_container( engine: ContainerEngine, verbose: bool, image: &str, name: &str, ports: &[(u16, u16)], ) -> Result<()> { // Clean up any existing dead container with this name (silently) let _ = crate::container::container_remove_quiet(engine, name); let port_str: Vec = ports .iter() .map(|(h, c)| format!("{h}:{c}")) .collect(); eprintln!( "Starting serve container {name} on ports {}...", port_str.join(", ") ); let mut cfg = RunConfig::new(image); cfg.read_only = true; cfg.remove_after = false; cfg.name = Some(name.to_string()); cfg.ports = ports.to_vec(); cfg.extra_flags = vec!["-d".to_string()]; if verbose { let exe = engine_executable(engine); let extra = crate::container::engine_specific_run_flags_io(engine); let args = crate::container::build_run_args(engine, &extra, &cfg); let quoted: Vec = args.iter().map(|a| { if a.contains(' ') { format!("'{a}'") } else { a.clone() } }).collect(); eprintln!("[morloc-manager] {exe} {}", quoted.join(" ")); } let (status, _stdout, run_err) = container_run(engine, &cfg); if !status.success() { let _ = crate::container::container_remove_quiet(engine, name); return Err(ManagerError::EngineError { engine, code: exit_code_to_int(status), stderr: run_err, }); } // Verify container reached running state thread::sleep(Duration::from_secs(1)); let exe = engine_executable(engine); let insp_output = Command::new(exe) .args(["inspect", "--format", "{{.State.Status}}", name]) .output(); match insp_output { Ok(o) if o.status.success() => { let state = String::from_utf8_lossy(&o.stdout).trim().to_string(); if state == "running" { eprintln!("Container {name} started"); eprintln!(" Logs: morloc-manager logs"); eprintln!(" Stop: morloc-manager stop {name}"); eprintln!(" Status: morloc-manager status"); Ok(()) } else { let log_output = Command::new(exe).args(["logs", name]).output(); let logs = log_output .map(|o| { let stdout = String::from_utf8_lossy(&o.stdout); let stderr = String::from_utf8_lossy(&o.stderr); 
format!("{stdout}{stderr}") }) .unwrap_or_default(); // Clean up the dead container to prevent name conflicts on retry let _ = container_remove(engine, name); Err(ManagerError::EngineError { engine, code: 1, stderr: format!("Container failed to start (state: {state}):\n{logs}"), }) } } _ => Err(ManagerError::EngineError { engine, code: 1, stderr: "Failed to inspect container state".to_string(), }), } } /// Serve an environment by bind-mounting its data directory into the container. pub fn serve_environment( engine: ContainerEngine, verbose: bool, image: &str, data_dir: &str, container_name: &str, ports: &[(u16, u16)], extra_flags: &[String], shm_size: &Option, user_env: &[(String, String)], ) -> Result<()> { // Clean up any existing dead container with this name (silently) let _ = crate::container::container_remove_quiet(engine, container_name); let port_str: Vec = ports .iter() .map(|(h, c)| format!("{h}:{c}")) .collect(); eprintln!( "Starting serve container {container_name} on ports {}...", port_str.join(", ") ); let mut cfg = RunConfig::new(image); cfg.read_only = true; cfg.remove_after = false; cfg.name = Some(container_name.to_string()); cfg.ports = ports.to_vec(); let mh = CONTAINER_MORLOC_HOME; cfg.bind_mounts = vec![(data_dir.to_string(), mh.to_string())]; cfg.env = vec![ ("PATH".to_string(), format!("{mh}/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin")), ("MORLOC_HOME".to_string(), mh.to_string()), ]; cfg.env.extend(user_env.iter().cloned()); cfg.command = Some(vec![ "morloc-nexus".to_string(), "--router".to_string(), "--fdb".to_string(), format!("{mh}/fdb"), "--http-port".to_string(), "8080".to_string(), ]); cfg.shm_size = shm_size.clone(); cfg.extra_flags = vec!["-d".to_string()]; cfg.extra_flags.extend(extra_flags.iter().cloned()); if verbose { let exe = engine_executable(engine); let extra = crate::container::engine_specific_run_flags_io(engine); let args = crate::container::build_run_args(engine, &extra, &cfg); let quoted: Vec = 
args.iter().map(|a| { if a.contains(' ') { format!("'{a}'") } else { a.clone() } }).collect(); eprintln!("[morloc-manager] {exe} {}", quoted.join(" ")); } let (status, _stdout, run_err) = container_run(engine, &cfg); if !status.success() { // `container_run` may have left a partially-created container behind // (e.g., port conflict after container creation). Clean it up so the // next `start` doesn't fail on a name collision. let _ = crate::container::container_remove_quiet(engine, container_name); // Detect port conflict and provide a friendlier error message let lower = run_err.to_lowercase(); if lower.contains("address already in use") || lower.contains("port is already allocated") || lower.contains("pasta failed") { // Try to extract the port number from the error let port_hint = ports.first() .map(|(h, _)| format!(" Port {h} is already in use.")) .unwrap_or_default(); return Err(ManagerError::EnvError(format!( "{port_hint}\n \ Another container or process is using this port.\n \ Use '-p :8080' to choose a different host port, or\n \ check running containers with 'morloc-manager status'." 
))); } return Err(ManagerError::EngineError { engine, code: exit_code_to_int(status), stderr: run_err, }); } // Verify container reached running state thread::sleep(Duration::from_secs(1)); let exe = engine_executable(engine); let insp_output = Command::new(exe) .args(["inspect", "--format", "{{.State.Status}}", container_name]) .output(); match insp_output { Ok(o) if o.status.success() => { let state = String::from_utf8_lossy(&o.stdout).trim().to_string(); if state == "running" { eprintln!("Container {container_name} started"); eprintln!(" Logs: morloc-manager logs"); eprintln!(" Stop: morloc-manager stop"); eprintln!(" Status: morloc-manager status"); Ok(()) } else { let log_output = Command::new(exe).args(["logs", container_name]).output(); let logs = log_output .map(|o| { let stdout = String::from_utf8_lossy(&o.stdout); let stderr = String::from_utf8_lossy(&o.stderr); format!("{stdout}{stderr}") }) .unwrap_or_default(); let _ = container_remove(engine, container_name); Err(ManagerError::EngineError { engine, code: 1, stderr: format!("Container failed to start (state: {state}):\n{logs}"), }) } } _ => Err(ManagerError::EngineError { engine, code: 1, stderr: "Failed to inspect container state".to_string(), }), } } pub fn stop_serve_container(engine: ContainerEngine, verbose: bool, name: &str) -> Result<()> { if !crate::container::container_exists(engine, name) { return Err(ManagerError::EnvError(format!( "No serve container running for '{name}'" ))); } if verbose { let exe = engine_executable(engine); eprintln!("[morloc-manager] {exe} stop {name}"); } let (status, err) = container_stop(engine, name); let _ = crate::container::container_remove_quiet(engine, name); if !status.success() { return Err(ManagerError::EngineError { engine, code: exit_code_to_int(status), stderr: err, }); } Ok(()) } /// Build the serve container name for an environment. 
/// Format: morloc-serve-- pub fn serve_container_name(env_name: &str) -> String { let user = std::env::var("USER") .or_else(|_| std::env::var("LOGNAME")) .unwrap_or_else(|_| "unknown".to_string()); format!("morloc-serve-{user}-{env_name}") } /// The prefix used to filter all serve containers for the current user. pub fn serve_container_prefix() -> String { let user = std::env::var("USER") .or_else(|_| std::env::var("LOGNAME")) .unwrap_or_else(|_| "unknown".to_string()); format!("morloc-serve-{user}-") } /// Extract the environment name from a serve container name. pub fn env_name_from_container(container_name: &str) -> &str { let prefix = serve_container_prefix(); container_name.strip_prefix(&prefix).unwrap_or(container_name) } #[derive(serde::Serialize)] pub struct ServeContainerInfo { pub name: String, pub env: String, pub ports: String, pub status: String, } /// Query running serve containers and return structured info. pub fn query_serve_containers(engine: ContainerEngine, verbose: bool) -> Result> { let exe = engine_executable(engine); let fmt = "{{.Names}}\t{{.Status}}\t{{.Ports}}"; let prefix = serve_container_prefix(); let filter = format!("name={prefix}"); if verbose { eprintln!("[morloc-manager] {exe} ps -a --filter {filter} --format '{fmt}'"); } let output = Command::new(exe) .args([ "ps", "-a", "--filter", &filter, "--format", fmt, ]) // Use /tmp as cwd to avoid podman "cannot chdir" failures when the // current directory is inaccessible (e.g. another user's home). 
.current_dir("/tmp") .output() .map_err(|e| ManagerError::EngineError { engine, code: 1, stderr: format!("Failed to list containers: {e}"), })?; if !output.status.success() { return Err(ManagerError::EngineError { engine, code: exit_code_to_int(output.status), stderr: String::from_utf8_lossy(&output.stderr).to_string(), }); } let text = String::from_utf8_lossy(&output.stdout).trim().to_string(); let mut result = Vec::new(); for line in text.lines() { let parts: Vec<&str> = line.split('\t').collect(); if parts.len() >= 3 { let name = parts[0]; let status = parts[1]; let ports = parts[2]; let env = env_name_from_container(name); result.push(ServeContainerInfo { name: name.to_string(), env: env.to_string(), ports: if ports.is_empty() { "-".to_string() } else { ports.to_string() }, status: status.to_string(), }); } } Ok(result) } /// Find running serve container names for the current user. pub fn find_running_serve_containers(engine: ContainerEngine) -> Vec { let exe = engine_executable(engine); let filter = format!("name={}", serve_container_prefix()); let output = Command::new(exe) .args(["ps", "--filter", &filter, "--format", "{{.Names}}"]) .current_dir("/tmp") .output(); match output { Ok(o) if o.status.success() => { String::from_utf8_lossy(&o.stdout) .lines() .filter(|l| !l.is_empty()) .map(|l| l.to_string()) .collect() } _ => Vec::new(), } } // ====================================================================== // Program validation // ====================================================================== /// Run `--help` for each installed program inside a container image to /// verify that pool processes start correctly (e.g. all imports resolve). /// /// `bind_mounts` should be non-empty for pre-freeze validation (where the /// data dir is on the host) and empty for post-unfreeze validation (where /// everything is baked into the image). 
pub fn validate_programs( engine: ContainerEngine, image: &str, programs: &[ProgramEntry], bind_mounts: Vec<(String, String)>, verbose: bool, ) -> Result<()> { if programs.is_empty() { return Ok(()); } eprintln!("Validating installed programs..."); let mut any_failed = false; for prog in programs { let exe_path = format!("{}/bin/{}", CONTAINER_MORLOC_HOME, prog.name); if verbose { let exe = engine_executable(engine); eprintln!("[morloc-manager] {exe} run --rm --entrypoint '' {image} {exe_path} --help"); } let cfg = RunConfig { bind_mounts: bind_mounts.clone(), command: Some(vec![exe_path, "--help".to_string()]), env: vec![ ("MORLOC_HOME".to_string(), CONTAINER_MORLOC_HOME.to_string()), ], // Override the image ENTRYPOINT so the command runs directly // instead of being appended to the router entrypoint. extra_flags: vec!["--entrypoint".to_string(), "".to_string()], ..RunConfig::new(image) }; let (status, _stdout, stderr) = container_run_quiet(engine, &cfg); if status.success() { let n = prog.commands.len(); eprintln!(" [ok] {} ({} commands)", prog.name, n); } else { let snippet: String = stderr.lines().take(5).collect::>().join("\n "); eprintln!(" [FAIL] {}: {}", prog.name, snippet); any_failed = true; } } if any_failed { return Err(ManagerError::FreezeError( "Some programs failed validation (see errors above)".to_string(), )); } Ok(()) } // ====================================================================== // Manifest path rewriting for frozen images // ====================================================================== const CONTAINER_MORLOC_HOME: &str = "/opt/morloc"; const MANIFEST_MARKER: &str = "### MANIFEST ###"; /// Rewrite `build.path` in every `.manifest` file under `fdb/` so the /// nexus inside the container chdirs to the correct location instead of /// the original host path. 
fn rewrite_manifest_paths(context_dir: &Path) -> Result<()> { let fdb_dir = context_dir.join("fdb"); if !fdb_dir.is_dir() { return Ok(()); } let entries = fs::read_dir(&fdb_dir) .map_err(|e| ManagerError::UnfreezeError(format!("read fdb/: {e}")))?; for entry in entries { let entry = entry .map_err(|e| ManagerError::UnfreezeError(format!("read fdb/ entry: {e}")))?; let path = entry.path(); let name = entry.file_name(); let name_str = name.to_string_lossy(); if !name_str.ends_with(".manifest") { continue; } let prog_name = &name_str[..name_str.len() - ".manifest".len()]; let container_build_path = format!("{}/exe/{}", CONTAINER_MORLOC_HOME, prog_name); rewrite_one_manifest(&path, &container_build_path)?; } Ok(()) } /// Rewrite the `build.path` field in a single manifest wrapper script. fn rewrite_one_manifest(path: &Path, new_build_path: &str) -> Result<()> { let content = fs::read_to_string(path) .map_err(|e| ManagerError::UnfreezeError(format!("read {}: {e}", path.display())))?; let (prefix, json_str) = if content.starts_with("#!") { if let Some(marker_pos) = content.find(MANIFEST_MARKER) { let after_marker = &content[marker_pos..]; let json_start = after_marker .find('\n') .map(|i| marker_pos + i + 1) .unwrap_or(content.len()); (&content[..json_start], &content[json_start..]) } else { return Ok(()); // no marker, skip } } else { ("", content.as_str()) }; let mut manifest: serde_json::Value = serde_json::from_str(json_str) .map_err(|e| ManagerError::UnfreezeError(format!("parse {}: {e}", path.display())))?; if let Some(build) = manifest.get_mut("build") { if let Some(p) = build.get_mut("path") { *p = serde_json::Value::String(new_build_path.to_string()); } } let new_json = serde_json::to_string(&manifest) .map_err(|e| ManagerError::UnfreezeError(format!("serialize {}: {e}", path.display())))?; let new_content = format!("{}{}\n", prefix, new_json); fs::write(path, new_content) .map_err(|e| ManagerError::UnfreezeError(format!("write {}: {e}", path.display())))?; 
Ok(()) } // ====================================================================== // Manifest and image resolution // ====================================================================== fn resolve_base_from_manifest( engine: ContainerEngine, m_manifest: Option<&FreezeManifest>, ver: Version, ) -> String { let ghcr_fallback = format!( "ghcr.io/morloc-project/morloc/morloc-full:{}", ver.show() ); let Some(fm) = m_manifest else { return ghcr_fallback; }; // Resolve the effective base image: use manifest's base_image if it exists // locally, otherwise fall back to the GHCR image. The manifest may record a // locally-retagged image (e.g. localhost/morloc:0.69.0) that won't exist on // other machines. let effective_base = if image_exists_locally(engine, &fm.base_image) { fm.base_image.clone() } else { eprintln!( "Base image '{}' not found locally, trying GHCR fallback...", fm.base_image ); ghcr_fallback }; match &fm.env_layer { None => effective_base, Some(fel) => { // Fast path: env image tag exists locally if let Some(ref tag) = fel.image_tag { let exe = engine_executable(engine); let check = Command::new(exe) .args(["image", "inspect", tag]) .stdout(Stdio::null()) .stderr(Stdio::null()) .status(); if check.map(|s| s.success()).unwrap_or(false) { return tag.clone(); } } // Rebuild env layer from stored Dockerfile using effective base rebuild_env_image(engine, &effective_base, fm, fel) } } } fn rebuild_env_image( engine: ContainerEngine, effective_base: &str, fm: &FreezeManifest, fel: &FrozenEnvLayer, ) -> String { let env_tag = format!( "localhost/morloc-env:{}-{}", fm.morloc_version.show(), fel.name ); let exe = engine_executable(engine); // Check if tagged image exists locally let check = Command::new(exe) .args(["image", "inspect", &env_tag]) .stdout(Stdio::null()) .stderr(Stdio::null()) .status(); if check.map(|s| s.success()).unwrap_or(false) { return env_tag; } eprintln!("Building deployment image (environment layer: {})", fel.name); let build_dir = 
"/tmp/morloc-env-rebuild"; let _ = fs::create_dir_all(build_dir); let df_path = format!("{build_dir}/Dockerfile"); let _ = fs::write(&df_path, &fel.dockerfile); let build_cfg = BuildConfig { dockerfile: df_path, context: build_dir.to_string(), tag: env_tag.clone(), build_args: vec![("CONTAINER_BASE".to_string(), effective_base.to_string())], }; let (status, _, build_err) = container_build(engine, &build_cfg); if status.success() { env_tag } else { eprintln!( "Warning: env rebuild failed, falling back to base image: {build_err}" ); effective_base.to_string() } } ================================================ FILE: data/rust/morloc-manager/src/types.rs ================================================ use serde::{Deserialize, Deserializer, Serialize, Serializer}; use std::cmp::Ordering; use std::str::FromStr; // ====================================================================== // Core enumerations // ====================================================================== #[derive(Debug, Clone, Copy, PartialEq, Eq, PartialOrd, Ord)] pub enum Scope { Local, System, } impl Serialize for Scope { fn serialize(&self, serializer: S) -> Result { match self { Scope::Local => serializer.serialize_str("local"), Scope::System => serializer.serialize_str("system"), } } } impl<'de> Deserialize<'de> for Scope { fn deserialize>(deserializer: D) -> Result { let s = String::deserialize(deserializer)?; match s.as_str() { "local" => Ok(Scope::Local), "system" => Ok(Scope::System), _ => Err(serde::de::Error::custom(format!("Unknown scope: {s}"))), } } } #[derive(Debug, Clone, Copy, PartialEq, Eq)] pub enum ContainerEngine { Docker, Podman, } impl Serialize for ContainerEngine { fn serialize(&self, serializer: S) -> Result { match self { ContainerEngine::Docker => serializer.serialize_str("docker"), ContainerEngine::Podman => serializer.serialize_str("podman"), } } } impl<'de> Deserialize<'de> for ContainerEngine { fn deserialize>(deserializer: D) -> Result { let s = 
String::deserialize(deserializer)?;
        match s.as_str() {
            "docker" => Ok(ContainerEngine::Docker),
            "podman" => Ok(ContainerEngine::Podman),
            _ => Err(serde::de::Error::custom(format!(
                "Unknown container engine: {s}"
            ))),
        }
    }
}

// ======================================================================
// Version
// ======================================================================

/// Semantic version with an optional pre-release suffix.
/// (`Option<String>` restored -- the extraction stripped the parameter.)
#[derive(Debug, Clone, PartialEq, Eq)]
pub struct Version {
    pub major: u32,
    pub minor: u32,
    pub patch: u32,
    pub prerelease: Option<String>,
}

impl Version {
    #[cfg(test)]
    pub fn new(major: u32, minor: u32, patch: u32) -> Self {
        Self {
            major,
            minor,
            patch,
            prerelease: None,
        }
    }

    /// Render as "MAJOR.MINOR.PATCH" or "MAJOR.MINOR.PATCH-PRE".
    pub fn show(&self) -> String {
        match &self.prerelease {
            Some(pre) => format!("{}.{}.{}-{}", self.major, self.minor, self.patch, pre),
            None => format!("{}.{}.{}", self.major, self.minor, self.patch),
        }
    }
}

impl Ord for Version {
    fn cmp(&self, other: &Self) -> Ordering {
        self.major
            .cmp(&other.major)
            .then(self.minor.cmp(&other.minor))
            .then(self.patch.cmp(&other.patch))
            .then(match (&self.prerelease, &other.prerelease) {
                (None, None) => Ordering::Equal,
                (Some(_), None) => Ordering::Less, // pre-release < release
                (None, Some(_)) => Ordering::Greater, // release > pre-release
                (Some(a), Some(b)) => a.cmp(b),
            })
    }
}

impl PartialOrd for Version {
    fn partial_cmp(&self, other: &Self) -> Option<Ordering> {
        Some(self.cmp(other))
    }
}

impl FromStr for Version {
    type Err = String;

    fn from_str(s: &str) -> Result<Self, Self::Err> {
        // Split off pre-release suffix on first '-': "0.77.0-rc.1" -> ("0.77.0", Some("rc.1"))
        let (version_part, prerelease) = match s.find('-') {
            Some(idx) => (&s[..idx], Some(s[idx + 1..].to_string())),
            None => (s, None),
        };
        let parts: Vec<&str> = version_part.split('.').collect();
        if parts.len() != 3 {
            return Err(format!("Invalid version: {s}. Expected format: MAJOR.MINOR.PATCH[-PRERELEASE]"));
        }
        let major = parts[0]
            .parse()
            .map_err(|_| format!("Invalid major version: {}", parts[0]))?;
        let minor = parts[1]
            .parse()
            .map_err(|_| format!("Invalid minor version: {}", parts[1]))?;
        let patch = parts[2]
            .parse()
            .map_err(|_| format!("Invalid patch version: {}", parts[2]))?;
        Ok(Version {
            major,
            minor,
            patch,
            prerelease,
        })
    }
}

// Serialized form is the `show()` string; parsing round-trips via FromStr.
impl Serialize for Version {
    fn serialize<S: Serializer>(&self, serializer: S) -> Result<S::Ok, S::Error> {
        serializer.serialize_str(&self.show())
    }
}

impl<'de> Deserialize<'de> for Version {
    fn deserialize<D: Deserializer<'de>>(deserializer: D) -> Result<Self, D::Error> {
        let s = String::deserialize(deserializer)?;
        s.parse().map_err(serde::de::Error::custom)
    }
}

// ======================================================================
// Configuration
// ======================================================================

/// Top-level manager configuration.
#[derive(Debug, Clone, Serialize, Deserialize)]
pub struct Config {
    /// Name of the active environment.
    pub active_env: Option<String>,
    /// Default container engine.
    #[serde(default = "default_engine")]
    pub engine: ContainerEngine,
}

fn default_engine() -> ContainerEngine {
    ContainerEngine::Podman
}

impl Default for Config {
    fn default() -> Self {
        Self {
            active_env: None,
            engine: ContainerEngine::Podman,
        }
    }
}

// ======================================================================
// Environment configuration
// ======================================================================

#[derive(Debug, Clone, Serialize, Deserialize)]
pub struct EnvironmentConfig {
    /// Human-readable name (also the directory name).
    pub name: String,
    /// Base container image reference.
    pub base_image: String,
    /// Original pullable image reference (e.g., :edge tag) before local re-tagging.
    #[serde(default)]
    pub original_image: Option<String>,
    /// Filename of the custom Dockerfile layer (within the env config dir).
    #[serde(default)]
    pub dockerfile: Option<String>,
    /// SHA256 hash of the Dockerfile content (for rebuild detection).
#[serde(default)] pub content_hash: Option, /// Built image tag after applying the Dockerfile layer. /// None when only the base image is used. #[serde(default)] pub built_image: Option, /// Container engine for this environment. pub engine: ContainerEngine, /// Shared memory size for container runs. #[serde(default = "default_shm_size")] pub shm_size: String, /// Morloc version this environment was created from. #[serde(default)] pub morloc_version: Option, } fn default_shm_size() -> String { "512m".to_string() } impl EnvironmentConfig { /// Returns the image to use for running containers. /// Prefers the built Dockerfile layer image, falls back to base_image. pub fn active_image(&self) -> &str { self.built_image.as_deref().unwrap_or(&self.base_image) } } // ====================================================================== // Freeze manifest // ====================================================================== #[derive(Debug, Clone, Serialize, Deserialize)] pub struct FreezeManifest { pub morloc_version: Version, pub frozen_at: chrono::DateTime, pub modules: Vec, pub programs: Vec, pub base_image: String, pub env_layer: Option, /// Deprecated: previously held expected env var names. Retained for backward /// compatibility when reading older freeze manifests. #[serde(default, skip_serializing)] #[allow(dead_code)] pub env_vars: Vec, } #[derive(Debug, Clone, Serialize, Deserialize)] pub struct FrozenEnvLayer { pub name: String, pub dockerfile: String, pub content_hash: String, /// Container image tag (e.g. localhost/morloc-env:0.79.2-dnd). /// Named image_tag because it stores a mutable tag, not a content-addressed digest. 
#[serde(alias = "image_digest")] pub image_tag: Option, } #[derive(Debug, Clone, Serialize, Deserialize)] pub struct ModuleEntry { pub name: String, pub version: Option, pub sha256: String, } #[derive(Debug, Clone, Serialize, Deserialize)] pub struct ProgramEntry { pub name: String, pub commands: Vec, } ================================================ FILE: data/rust/morloc-manifest/Cargo.toml ================================================ [package] name = "morloc-manifest" version = "0.81.0" edition = "2021" description = "Morloc manifest schema (v2): shared Rust types for the .manifest JSON blob produced by the morloc compiler and consumed by the nexus, runtime, and any future tooling." # Version is intentionally synchronized with the morloc compiler version # (see ../../../package.yaml). Manifests record the morloc_version that # built them; consumers reject manifests whose version differs from # CARGO_PKG_VERSION at parse time. Bumping the morloc compiler version # requires bumping this version in lockstep. [dependencies] serde = { workspace = true } serde_json = { workspace = true } ================================================ FILE: data/rust/morloc-manifest/src/lib.rs ================================================ //! Morloc manifest schema (v2) -- canonical Rust types. //! //! The morloc compiler emits a `.manifest` JSON blob describing every //! exported command's interface. This crate is the **single source of //! truth** for that schema's Rust representation. Both the CLI nexus //! (`morloc-nexus`) and the C-FFI runtime (`morloc-runtime`) depend on //! these types so neither has to maintain its own deserialization //! logic. //! //! ## Versioning //! //! The manifest does not carry a dedicated schema version. Manifests //! are transient build artifacts (always regenerated on `morloc make`, //! never stored in version control), so the morloc compiler version //! recorded in the [`Build`] sub-object serves as the staleness //! indicator. 
The check happens in [`parse_manifest`]. //! //! Version coupling: this crate's `CARGO_PKG_VERSION` is intentionally //! kept in lockstep with the morloc Haskell compiler version (see //! `package.yaml`). The same is true of `morloc-nexus` and //! `morloc-runtime` -- bumping the morloc compiler requires bumping //! all three Rust crates in the same commit. //! //! ## Extension slots //! //! Every entity object (manifest, pool, command, arg, return, group, //! service) carries: //! //! - `constraints: Vec` -- enforceable rules. Currently //! the compiler emits only the `kind` constraint on named-type args //! (record/object/table). Future constraints (`min`, `max`, `regex`, //! `length`, `non_empty`, `row_count`, ...) will append to this //! list without any schema change. //! //! - `metadata: BTreeMap` -- free-form //! informational key-value pairs. Always emitted as `{}` today; //! reserved so consumers never have to check whether the field //! exists. Future doc hints, studio annotations, telemetry tags, //! etc. live here until they stabilize into first-class fields. //! //! Many of these slots are `#[allow(dead_code)]` because no current //! consumer reads them. They are deliberate forward-compatible //! placeholders, not vestigial fields. //! //! ## Unknown-field tolerance //! //! All structs use `#[serde(default)]` on optional fields and silently //! ignore unknown JSON keys. A manifest written by a newer morloc //! compiler will still parse with an older nexus (modulo the version //! mismatch error in [`parse_manifest`]). use serde::Deserialize; use std::collections::BTreeMap; /// Convenient alias for the `metadata` extension slot. Using /// `BTreeMap` (rather than `HashMap` or raw `serde_json::Value`) gives /// us (a) compile-time enforcement that metadata is always a JSON /// object, and (b) deterministic iteration order for stable diffs. 
pub type Metadata = BTreeMap; // -- Top-level manifest ------------------------------------------------------- /// The top-level manifest object. Embedded in every built nexus binary /// as a JSON blob after the `### MANIFEST ###` marker. #[derive(Debug, Deserialize)] #[allow(dead_code)] pub struct Manifest { /// Program identifier -- comes from the morloc `module` declaration. pub name: String, /// Compiler-sourced build metadata (path, timestamp, version). /// Distinct from the user-sourced top-level `metadata` slot. pub build: Build, /// Language pool daemons that this program dispatches to. #[serde(default)] pub pools: Vec, /// Exported commands the user can invoke. #[serde(default)] pub commands: Vec, /// Command groups for organizing CLI subcommands in help output. #[serde(default)] pub groups: Vec, /// Daemon-mode service configuration. None for normal CLI mode. #[serde(default)] pub service: Option, /// Module-level description lines (from docstrings before `module`). /// Shown after "Usage:" and before "Nexus options" in top-level help. #[serde(default)] pub desc: Vec, /// Epilogue blocks shown at the end of top-level help output. #[serde(default)] pub epilogues: Vec>, /// **Reserved.** User-sourced free-form annotations on the module. /// Always emitted as `{}` today. Distinct from `build` (which is /// compiler-sourced). #[serde(default)] pub metadata: Metadata, } /// Compiler-sourced metadata about how this manifest was produced. /// /// Future build fields (`hash`, `source_hash`, `host`, `user`, `system`, /// `dependencies`, `cflags`, `reproducible`, ...) will be added directly /// to this struct as additive non-breaking changes -- no sub-metadata /// nesting required. #[derive(Debug, Deserialize)] #[allow(dead_code)] pub struct Build { /// Absolute path to the build directory containing this program's /// pool executables and generated source files. The nexus chdirs /// here at startup so relative pool exec paths resolve. 
pub path: String, /// Unix timestamp at which the manifest was generated. pub time: i64, /// Version of the morloc compiler that produced this manifest. The /// nexus compares this against its own compile-time /// `CARGO_PKG_VERSION` (which is intentionally synchronized with /// the morloc compiler version) in [`parse_manifest`]; a mismatch /// produces an actionable "rebuild with the current compiler" /// error. pub morloc_version: String, } /// A single language pool daemon. Each pool is one OS process that /// hosts the language-specific implementations of source functions. #[derive(Debug, Deserialize)] #[allow(dead_code)] pub struct Pool { /// Language tag (e.g. `"py"`, `"cpp"`, `"r"`, `"julia"`). pub lang: String, /// argv used to spawn the pool process (e.g. `["python3", "pool.py"]`). pub exec: Vec, /// Unix domain socket basename (under tmpdir) for IPC. pub socket: String, /// **Reserved.** Per-pool metadata. Future slots: `resource` /// (cpu/memory limits), `env` (environment variables), /// `startup_timeout`, `health_check`. #[serde(default)] pub metadata: Metadata, } // -- Commands ----------------------------------------------------------------- /// Discriminator for the command kind. Closed enum so adding a new /// variant requires explicit code changes everywhere it's matched. #[derive(Debug, Deserialize, Clone, Copy, PartialEq, Eq)] #[serde(rename_all = "lowercase")] pub enum CmdType { /// Dispatched to a language pool process via IPC. Remote, /// Evaluated inline by the nexus from an embedded expression tree. Pure, } /// One exported morloc function the user can invoke as a CLI subcommand. #[derive(Debug, Deserialize)] #[allow(dead_code)] pub struct Command { /// CLI subcommand name (defaults to the morloc function name; can /// be overridden via a `--' name:` docstring directive). pub name: String, /// Discriminator: [`CmdType::Remote`] (dispatch to a pool) or /// [`CmdType::Pure`] (evaluate inline via the manifest's `expr` /// tree). 
#[serde(rename = "type")] pub cmd_type: CmdType, // -- Remote-only dispatch info ---------------------------------------- /// Manifold ID -- the integer key under which the pool's dispatch /// table contains this function's entry. Remote commands only. #[serde(default)] pub mid: u32, /// Index into [`Manifest::pools`] for the primary pool that hosts /// this command's top-level function. Remote commands only. #[serde(default, rename = "pool")] pub pool_index: usize, /// Indices of every pool transitively required to execute this /// command (the primary pool plus any pools called as foreign /// functions from inside it). Remote commands only. #[serde(default)] pub needed_pools: Vec, // -- Common fields ---------------------------------------------------- /// Description lines shown in CLI help. The first line is the /// summary used in subcommand listings. #[serde(default)] pub desc: Vec, /// Argument list, in declaration order. Each entry is a /// discriminated union -- see [`Arg`]. #[serde(default)] pub args: Vec, /// Return-value descriptor. Always present, even for nullary /// returns (use a Nil schema in that case). #[serde(default, rename = "return")] pub ret: Return, /// **Reserved.** Command-level constraints -- invariants that span /// multiple arguments (e.g. `equal_length` of two list args). /// Empty in v2; populated when the constraint system rolls out. #[serde(default)] pub constraints: Vec, /// **Reserved.** Per-command metadata. Future slots: `effects` /// (declared I/O / network / filesystem effect set), `resource` /// (CPU/memory/time limits), `auth` (required capabilities), /// `version` (semantic version of the command's API), /// `deprecated` (migration notice). #[serde(default)] pub metadata: Metadata, // -- Pure-only evaluation info ---------------------------------------- /// Embedded expression tree (NexusExpr JSON) for pure commands. /// Evaluated inline by the nexus instead of being dispatched to a /// pool. Absent on remote commands. 
#[serde(default)] pub expr: Option, // -- Command group ---------------------------------------------------- /// Optional name of the command group this command belongs to. Used /// to organize subcommands in help output. The Haskell emitter now /// writes a real JSON null for absent groups (see /// `Morloc.CodeGenerator.Nexus.cmdGroupField`), so no custom /// deserializer is needed. #[serde(default)] pub group: Option, } impl Command { pub fn is_pure(&self) -> bool { self.cmd_type == CmdType::Pure } } /// Return-value descriptor. Structurally similar to a typed [`Arg`] /// minus the CLI-specific fields (kind, metavar, quoted, short/long, /// default). Always present on every command. #[derive(Debug, Deserialize, Default)] #[allow(dead_code)] pub struct Return { /// Morloc serialization schema string for the return type. The /// nexus uses this to deserialize the bytes coming back from the /// pool process. #[serde(default)] pub schema: String, /// User-facing type name as written in the morloc source (e.g. /// `"Int"`, `"Config"`, `"[Int]"`). Used in help output and error /// messages. JSON key is `type`; the Rust field is `type_desc` /// because `type` is a reserved keyword. #[serde(default, rename = "type")] pub type_desc: String, /// Description lines for the return value, parsed from `--' return:` /// docstrings. #[serde(default)] pub desc: Vec, /// **Reserved.** Constraints on the return value. Currently used /// only for `kind: record|object|table` on named return types; /// future constraints (min/max/regex/...) will live here. #[serde(default)] pub constraints: Vec, /// **Reserved.** Per-return metadata; same forward-compatibility /// rationale as the per-arg slot. #[serde(default)] pub metadata: Metadata, } // -- Constraints -------------------------------------------------------------- /// A single constraint entry attached to an arg, return value, or /// command. Discriminated by `type`. 
/// /// **Currently emitted constraint types**: /// /// - `kind`: marks a named type as `record` / `object` / `table`. The /// `value` payload is the lowercased name. The CLI help renderer /// uses this to partition into Record Schemas / Table Schemas /// sections. /// /// **Reserved constraint types** (defined shapes, not yet emitted by /// any compiler pass -- names and payloads chosen so the schema /// doesn't need to bump when the constraint feature lands): /// /// - `min`, `max`: numeric bounds with `value: `. /// - `length`: `value: ` for a fixed length, or `{min, max}` for /// a bounded range. /// - `non_empty`: list/string must be non-empty (no payload). /// - `regex`: string must match `value: ""`. /// - `enum`: value must be one of `value: [...]`. /// - `unique`: list elements must be pairwise distinct (no payload). /// - `row_count`: fixed/bounded row count for `table`-tagged args. /// - `sorted`: `value: "asc"|"desc"`. /// /// **Extensibility rules**: /// /// 1. Unknown `type` values MUST be silently ignored by readers. /// 2. Adding a new constraint type does not bump the manifest version. /// 3. Changing the payload shape of an existing type DOES bump. /// 4. Constraints are unordered. /// 5. Multiple constraints of the same type on the same entity are /// allowed. #[derive(Debug, Deserialize, Clone)] #[allow(dead_code)] pub struct Constraint { /// Constraint discriminator. JSON key is `type`; the Rust field is /// `ctype` because `type` is a reserved keyword. #[serde(rename = "type")] pub ctype: String, /// Constraint-specific payload. Shape depends on `ctype`. Some /// constraint types (`non_empty`, `unique`) carry no payload. #[serde(default)] pub value: Option, } // -- Arguments ---------------------------------------------------------------- /// CLI argument variants. Each command's argument list is a sequence /// of these, in declaration order. 
/// /// Three of the four variants (`Positional`, `Optional`, `Group`) /// carry type/schema/constraints information because they represent /// typed values that flow through to a pool. `Flag` is a pure boolean /// toggle with no associated type -- and therefore no `schema`, /// `type_desc`, or `constraints` slot. /// /// `#[allow(dead_code)]` covers the `metadata` slots that are reserved /// for future use and not read by any current consumer. #[derive(Debug, Deserialize)] #[serde(tag = "kind")] #[allow(dead_code)] pub enum Arg { /// A positional CLI argument. #[serde(rename = "pos")] Positional { /// Morloc serialization schema string. Used at dispatch time /// to parse the user's CLI input into a binary data packet. #[serde(default)] schema: Option, /// User-facing type name (e.g. `"Int"`, `"Config"`). The Rust /// field is `type_desc` because `type` is a reserved keyword. #[serde(default, rename = "type")] type_desc: Option, /// Display placeholder shown in help (e.g. `"FILE"`). None /// falls back to a generic `ARG` placeholder. #[serde(default)] metavar: Option, /// If true, the user's CLI value is JSON-wrapped before being /// passed to the pool. Used for `Str`-typed positionals /// declared with `--' literal: true`. #[serde(default)] quoted: bool, /// Description lines from `--' desc:` docstrings. #[serde(default)] desc: Vec, /// Per-argument enforceable invariants. Currently only the /// `kind` constraint is emitted (for named-type args). Future /// constraints (min/max/regex/length/...) will populate this. #[serde(default)] constraints: Vec, /// **Reserved.** Per-argument informational metadata. Always /// emitted as `{}` in v2; not yet read by any consumer. #[serde(default)] metadata: Metadata, }, /// An optional CLI argument with a long/short option name. #[serde(rename = "opt")] Optional { /// Morloc serialization schema for the option's value type. #[serde(default)] schema: Option, /// User-facing type name. JSON key is `type`. 
#[serde(default, rename = "type")] type_desc: Option, /// Required display placeholder (e.g. `"FILE"`). #[serde(default)] metavar: Option, /// JSON-wrap flag for `Str`-typed literal options. #[serde(default)] quoted: bool, /// Single-character short option (e.g. `"f"` for `-f`). #[serde(default, rename = "short")] short_opt: Option, /// Long option name (e.g. `"file"` for `--file`). #[serde(default, rename = "long")] long_opt: Option, /// Default value used when the user does not pass the option. /// Always present (declared via `--' default:` docstring). #[serde(default, rename = "default")] default_val: Option, /// Description lines. #[serde(default)] desc: Vec, /// Per-argument constraints -- see [`Arg::Positional`]'s /// `constraints` field. #[serde(default)] constraints: Vec, /// **Reserved.** Per-argument metadata. Not read in v2. #[serde(default)] metadata: Metadata, }, /// A pure boolean flag toggle. Carries no type, schema, or /// constraints because it has no payload -- flipping the flag /// produces the value `true` or `false`. #[serde(rename = "flag")] Flag { /// Single-character short option (e.g. `"v"` for `-v`). #[serde(default, rename = "short")] short_opt: Option, /// Long option name (e.g. `"verbose"` for `--verbose`). #[serde(default, rename = "long")] long_opt: Option, /// Long option name that flips the flag in the opposite /// direction (e.g. `"no-verbose"` for `--no-verbose`). #[serde(default)] long_rev: Option, /// Default value when the flag is not present on the CLI. /// String form: `"true"` or `"false"`. #[serde(default, rename = "default")] default_val: Option, /// Description lines. #[serde(default)] desc: Vec, /// **Reserved.** Per-flag metadata. Not read in v2. #[serde(default)] metadata: Metadata, }, /// A record-typed argument that has been "unrolled" into a flat /// collection of CLI flags/options, one per record field. 
The /// group's top-level `schema` is the schema of the whole record; /// dispatch sends the assembled record to the pool, so individual /// entries never need their own schemas. #[serde(rename = "grp")] Group { /// Morloc schema for the whole record (a `Map` schema). #[serde(default)] schema: Option, /// User-facing record type name (e.g. `"SysConfig"`). #[serde(default, rename = "type")] type_desc: Option, /// Display placeholder for the group as a whole. #[serde(default)] metavar: Option, /// Description lines for the group. #[serde(default)] desc: Vec, /// Optional CLI option that accepts the entire record as a /// single JSON value (e.g. `--sys-config '{...}'`). #[serde(default)] group_opt: Option, /// Flattened per-field options/flags. Each entry's `arg` is a /// nested [`Arg`] (typically `Optional` or `Flag`) that has /// no schema of its own -- only the group's top-level schema /// matters at dispatch time. #[serde(default)] entries: Vec, /// Per-group constraints. Currently the `kind` constraint /// (almost always `record`) is emitted. #[serde(default)] constraints: Vec, /// **Reserved.** Per-group metadata. Not read in v2. #[serde(default)] metadata: Metadata, }, } /// Nested CLI option that accepts the entire record (associated with /// an [`Arg::Group`]) as a single JSON value. #[derive(Debug, Deserialize)] #[allow(dead_code)] pub struct GroupOpt { /// Short option char that accepts the whole record as one JSON value. #[serde(default, rename = "short")] pub short_opt: Option, /// Long option name that accepts the whole record as one JSON value. #[serde(default, rename = "long")] pub long_opt: Option, } /// One entry inside an [`Arg::Group`] -- pairs a record field name /// with the CLI flag/option that backs it. #[derive(Debug, Deserialize)] #[allow(dead_code)] pub struct GroupEntry { /// Record field name. pub key: String, /// CLI binding for this field. 
Always a [`Arg::Optional`] or /// [`Arg::Flag`] in practice; never carries its own schema (the /// containing group's schema covers all fields). pub arg: Arg, } /// CLI command group -- purely organizational metadata used to bucket /// related subcommands together in the help output. #[derive(Debug, Deserialize)] #[allow(dead_code)] pub struct CmdGroup { /// Group name; matches `Command::group` on member commands. pub name: String, /// Group description lines for the help output. #[serde(default)] pub desc: Vec, /// **Reserved.** Per-group metadata. Not read in v2. #[serde(default)] pub metadata: Metadata, } /// Daemon-mode service configuration. Present only when the program /// is configured to run as a long-lived service rather than a one-shot /// CLI invocation. #[derive(Debug, Deserialize)] #[allow(dead_code)] pub struct Service { /// Transport type: typically `"http"`, `"tcp"`, or `"unix"`. #[serde(rename = "type")] pub service_type: Option, /// Listening host address (TCP/HTTP). pub host: Option, /// Listening port (TCP/HTTP). pub port: Option, /// Unix socket path (when `service_type` is `"unix"`). pub socket: Option, /// **Reserved.** Per-service metadata. Not read in v2. #[serde(default)] pub metadata: Metadata, } // -- I/O ---------------------------------------------------------------------- /// Read the manifest payload from a built-nexus wrapper script. The /// nexus binary is wrapped in a shell script that contains a /// `### MANIFEST ###` marker followed by the JSON blob. Plain JSON /// files (no shebang) are returned as-is. 
pub fn read_manifest_payload(path: &str) -> Result { let content = std::fs::read_to_string(path) .map_err(|e| format!("Cannot open manifest file '{}': {}", path, e))?; if content.starts_with("#!") { if let Some(pos) = content.find("### MANIFEST ###") { let after_marker = &content[pos..]; let payload_start = after_marker .find('\n') .map(|i| pos + i + 1) .unwrap_or(content.len()); Ok(content[payload_start..].to_string()) } else { Err("No ### MANIFEST ### marker found in wrapper script".into()) } } else { Ok(content) } } /// Parse a manifest JSON payload into a [`Manifest`]. Performs a /// staleness check on `build.morloc_version` against this crate's own /// `CARGO_PKG_VERSION` (which is intentionally pinned to match the /// morloc compiler version). Mismatched versions return a clean /// "rebuild with the current compiler" error rather than silently /// misinterpreting the manifest. pub fn parse_manifest(payload: &str) -> Result { let m: Manifest = serde_json::from_str(payload) .map_err(|e| format!("Failed to parse manifest JSON: {}", e))?; let crate_version = env!("CARGO_PKG_VERSION"); if m.build.morloc_version != crate_version { return Err(format!( "manifest built with morloc {}, runtime is {}; rebuild with the current compiler", m.build.morloc_version, crate_version )); } Ok(m) } // -- Arg accessors ------------------------------------------------------------ // // Variant-agnostic helpers for the fields that exist on multiple Arg // variants. Callers in the nexus and runtime use these instead of // pattern-matching at every site. impl Arg { /// Single-character short option (e.g. `'f'` for `-f`). Returns /// None for positional and group args. pub fn short_opt_char(&self) -> Option { let s = match self { Arg::Optional { short_opt, .. } => short_opt.as_deref(), Arg::Flag { short_opt, .. } => short_opt.as_deref(), _ => None, }; s.and_then(|s| s.chars().next()) } /// Long option name (e.g. `"verbose"` for `--verbose`). 
Returns /// None for positional and group args. pub fn long_opt_str(&self) -> Option<&str> { match self { Arg::Optional { long_opt, .. } => long_opt.as_deref(), Arg::Flag { long_opt, .. } => long_opt.as_deref(), _ => None, } } /// True if this arg is a boolean flag toggle. pub fn is_flag(&self) -> bool { matches!(self, Arg::Flag { .. }) } /// True if the user's CLI value should be JSON-wrapped before /// being passed to the pool. Used for `Str`-typed arguments /// declared with `--' literal: true`. Always false for flags and /// groups. pub fn is_quoted(&self) -> bool { match self { Arg::Positional { quoted, .. } | Arg::Optional { quoted, .. } => *quoted, _ => false, } } /// Default CLI value when the user does not pass the argument. /// Returns None for positional args (which are always required) /// and groups. pub fn default_val(&self) -> Option<&str> { match self { Arg::Optional { default_val, .. } => default_val.as_deref(), Arg::Flag { default_val, .. } => default_val.as_deref(), _ => None, } } /// CLI display placeholder (e.g. `"FILE"`, `"INT"`). None for /// flags and for positional args without an explicit metavar. pub fn metavar_str(&self) -> Option<&str> { match self { Arg::Positional { metavar, .. } => metavar.as_deref(), Arg::Optional { metavar, .. } => metavar.as_deref(), Arg::Group { metavar, .. } => metavar.as_deref(), _ => None, } } /// Description lines from the source-level docstring. Always /// available regardless of variant. pub fn desc_lines(&self) -> &[String] { match self { Arg::Positional { desc, .. } | Arg::Optional { desc, .. } | Arg::Flag { desc, .. } | Arg::Group { desc, .. } => desc, } } /// User-facing type name for typed args (e.g. `"Int"`, /// `"Config"`). Returns None for flags, which carry no type. pub fn type_desc_str(&self) -> Option<&str> { match self { Arg::Positional { type_desc, .. } | Arg::Optional { type_desc, .. } | Arg::Group { type_desc, .. } => type_desc.as_deref(), Arg::Flag { .. 
} => None, } } /// Morloc serialization schema string for typed args. Returns /// None for flags. The schema drives both dispatch (how to encode /// the value into a packet) and help rendering (how to extract /// record field layouts for the Record/Table Schemas sections). pub fn schema_str(&self) -> Option<&str> { match self { Arg::Positional { schema, .. } | Arg::Optional { schema, .. } | Arg::Group { schema, .. } => schema.as_deref(), Arg::Flag { .. } => None, } } /// All constraints attached to this arg. Empty for flags. The /// caller is responsible for filtering by constraint type and /// silently ignoring unknown types (per the extensibility rules /// on [`Constraint`]). pub fn constraints(&self) -> &[Constraint] { match self { Arg::Positional { constraints, .. } | Arg::Optional { constraints, .. } | Arg::Group { constraints, .. } => constraints, Arg::Flag { .. } => &[], } } /// Convenience accessor: extract the `value` of the `kind` /// constraint as a string slice. Returns the lowercased /// `"record"`, `"object"`, or `"table"` for named-type args. /// None for everything else (including untagged primitive types). pub fn kind_constraint(&self) -> Option<&str> { self.constraints() .iter() .find(|c| c.ctype == "kind") .and_then(|c| c.value.as_ref().and_then(|v| v.as_str())) } } // -- Tests -------------------------------------------------------------------- #[cfg(test)] mod tests { use super::*; /// Wrap a v2 command body with the required top-level fields so /// each test fixture stays compact. 
fn wrap(commands_json: &str) -> String { let v = env!("CARGO_PKG_VERSION"); format!( r#"{{ "name": "main", "build": {{ "path": "/tmp/test", "time": 0, "morloc_version": "{}" }}, "pools": [ {{"lang": "py", "exec": ["python3", "pool.py"], "socket": "pipe-py", "metadata": {{}}}} ], "commands": {}, "groups": [], "metadata": {{}} }}"#, v, commands_json ) } #[test] fn test_parse_simple_manifest() { let json = wrap( r#"[ { "name": "f", "type": "remote", "mid": 1, "pool": 0, "needed_pools": [0], "desc": [], "args": [ { "kind": "pos", "schema": "s", "type": "Str", "metavar": null, "quoted": false, "desc": [], "constraints": [], "metadata": {} } ], "return": { "schema": "s", "type": "Str", "desc": [], "constraints": [], "metadata": {} }, "constraints": [], "metadata": {}, "group": null } ]"#, ); let m = parse_manifest(&json).unwrap(); assert_eq!(m.pools.len(), 1); assert_eq!(m.pools[0].lang, "py"); assert_eq!(m.commands.len(), 1); assert_eq!(m.commands[0].name, "f"); assert!(!m.commands[0].is_pure()); assert_eq!(m.commands[0].mid, 1); assert!(m.commands[0].group.is_none()); assert_eq!(m.commands[0].args.len(), 1); assert_eq!(m.commands[0].args[0].schema_str(), Some("s")); assert_eq!(m.commands[0].args[0].type_desc_str(), Some("Str")); assert_eq!(m.commands[0].ret.schema, "s"); assert_eq!(m.commands[0].ret.type_desc, "Str"); } #[test] fn test_parse_pure_command() { let json = wrap( r#"[ { "name": "greet", "type": "pure", "desc": ["Say hello"], "args": [ { "kind": "pos", "schema": "s", "type": "Str", "metavar": "NAME", "quoted": true, "desc": ["name"], "constraints": [], "metadata": {} } ], "return": { "schema": "s", "type": "Str", "desc": [], "constraints": [], "metadata": {} }, "expr": {"tag": "lit", "schema": "s", "lit_type": "str", "value": "hello"}, "constraints": [], "metadata": {}, "group": null } ]"#, ); let m = parse_manifest(&json).unwrap(); assert!(m.commands[0].is_pure()); assert!(m.commands[0].expr.is_some()); } #[test] fn test_parse_kind_constraint() { let json = 
wrap( r#"[ { "name": "process", "type": "remote", "mid": 1, "pool": 0, "needed_pools": [0], "desc": [], "args": [ { "kind": "pos", "schema": "m24nameas3ageai4", "type": "People", "metavar": null, "quoted": false, "desc": [], "constraints": [ {"type": "kind", "value": "table"} ], "metadata": {} } ], "return": { "schema": "i4", "type": "Int", "desc": [], "constraints": [], "metadata": {} }, "constraints": [], "metadata": {}, "group": null } ]"#, ); let m = parse_manifest(&json).unwrap(); assert_eq!(m.commands[0].args[0].kind_constraint(), Some("table")); } #[test] fn test_version_mismatch_rejected() { let json = r#"{ "name": "main", "build": {"path": "/tmp/x", "time": 0, "morloc_version": "0.0.1-stale"}, "pools": [], "commands": [], "groups": [], "metadata": {} }"#; let err = parse_manifest(json).unwrap_err(); assert!( err.contains("rebuild with the current compiler"), "got: {}", err ); } } ================================================ FILE: data/rust/morloc-nexus/Cargo.toml ================================================ [package] name = "morloc-nexus" version = "0.81.0" edition = "2021" description = "Morloc nexus: CLI dispatcher for multi-language pool orchestration" # Version is intentionally synchronized with the morloc compiler version # (see ../../../package.yaml). Manifests record the morloc_version that # built them; the nexus rejects manifests whose version differs from its # own CARGO_PKG_VERSION at parse time. Bumping the morloc compiler # version requires bumping this version in lockstep. 
[[bin]] name = "morloc-nexus" path = "src/main.rs" [dependencies] morloc-manifest = { path = "../morloc-manifest" } morloc-runtime = { path = "../morloc-runtime" } libc = { workspace = true } serde = { workspace = true } serde_json = { workspace = true } nix = { workspace = true } clap = { workspace = true } thiserror = { workspace = true } ================================================ FILE: data/rust/morloc-nexus/build.rs ================================================ fn main() { // Use MORLOC_HOME at build time if set, else fall back to $HOME default. // This is only for the compile-time link search path. let morloc_lib = std::env::var("MORLOC_HOME") .map(|h| format!("{}/lib", h)) .unwrap_or_else(|_| { format!( "{}/.local/share/morloc/lib", std::env::var("HOME").unwrap_or_else(|_| "/root".into()) ) }); println!("cargo:rustc-link-search=native={}", morloc_lib); println!("cargo:rustc-link-lib=dylib=morloc"); // Embed $ORIGIN-relative rpaths so the nexus finds libmorloc.so // regardless of install location: // $ORIGIN/../lib covers /opt/morloc/bin -> /opt/morloc/lib // $ORIGIN/../share/morloc/lib covers ~/.local/bin -> ~/.local/share/morloc/lib println!("cargo:rustc-link-arg=-Wl,-rpath,$ORIGIN/../lib"); println!("cargo:rustc-link-arg=-Wl,-rpath,$ORIGIN/../share/morloc/lib"); // The morloc compiler version is sourced from CARGO_PKG_VERSION // (this crate's Cargo.toml), which is intentionally kept in // lockstep with the morloc Haskell package.yaml. No build-time // extraction needed -- Cargo guarantees CARGO_PKG_VERSION is set // and rebuilds when Cargo.toml changes. } ================================================ FILE: data/rust/morloc-nexus/src/dispatch.rs ================================================ //! Command dispatch: CLI argument parsing and routing to pools. //! //! Replaces the dispatch_command, dispatch, run_command, and run_pure_command //! functions from nexus.c. Uses the C libmorloc for packet construction and //! 
serialization until Phase 2/3 replaces those. //! //! For Phase 1, the nexus links against the C libmorloc.so for: //! - make_call_packet_from_cli, parse_cli_data_argument //! - send_and_receive_over_socket //! - pack_with_schema, print_voidstar, etc. //! - morloc_eval for pure commands use crate::help; use crate::manifest::{Arg, Command, Manifest}; use crate::process::{self, PoolSocket}; /// Output format enum. #[derive(Debug, Clone, Copy, PartialEq)] pub enum OutputFormat { Json, MessagePack, VoidStar, Packet, } /// Nexus configuration parsed from CLI options. #[derive(Debug, Clone)] pub struct NexusConfig { pub help_flag: bool, pub print_flag: bool, pub packet_path: Option, pub socket_base: Option, pub output_path: Option, pub output_format: OutputFormat, pub daemon_flag: bool, pub router_flag: bool, pub unix_socket_path: Option, pub tcp_port: Option, pub http_port: Option, pub fdb_path: Option, pub eval_timeout: i32, } impl Default for NexusConfig { fn default() -> Self { NexusConfig { help_flag: false, print_flag: false, packet_path: None, socket_base: None, output_path: None, output_format: OutputFormat::Json, daemon_flag: false, router_flag: false, unix_socket_path: None, tcp_port: None, http_port: None, fdb_path: None, eval_timeout: 30, } } } /// Emit a uniform error when pool communication fails, then exit. /// /// The pool's stderr was inherited by the nexus, so any traceback the pool /// printed before dying is already on the user's terminal. This helper /// reports the communication error plus the pool's exit status (if it has /// been reaped) so the user can correlate the two. /// /// Race condition: the pool process may still be writing its error output /// (traceback, panic message, etc.) to stderr when the nexus detects the /// broken connection. If we call clean_exit immediately, it sends SIGTERM /// to the pool process group, which can kill the pool before its stderr /// buffer is flushed. 
We insert a brief drain window to let any in-flight /// stderr from the dying pool reach the terminal before tearing everything /// down. This is best-effort: a pool killed by SIGKILL (OOM killer, etc.) /// won't have pending output, and a pool stuck in a blocking syscall won't /// flush within the window. But for the common case of a Python exception /// traceback, this is enough. fn die_with_pool_error( socket: &PoolSocket, pool_index: usize, context: &str, comm_err: &dyn std::fmt::Display, ) -> ! { // Give the dying pool process time to flush its stderr/stdout before // we tear down the process group. Without this, a Python traceback or // error message that is still in a pipe buffer gets lost when // clean_exit sends SIGTERM/SIGKILL to the pool's process group. std::thread::sleep(std::time::Duration::from_millis(100)); eprintln!("Error: {}: {}", context, comm_err); if let Some(info) = process::pool_death_info(pool_index) { eprintln!("Pool '{}' {}", socket.lang, info); } process::clean_exit(1); } /// Parse nexus-level options from argv. Returns the index of the first /// non-option argument (the manifest path or subcommand). 
pub fn parse_nexus_options(args: &[String], config: &mut NexusConfig) -> usize {
    let mut i = 1; // skip argv[0]
    while i < args.len() {
        let arg = &args[i];
        match arg.as_str() {
            "-h" | "--help" => {
                config.help_flag = true;
                i += 1;
            }
            "-p" | "--print" => {
                config.print_flag = true;
                i += 1;
            }
            "-c" | "--call-packet" => {
                i += 1;
                if i < args.len() {
                    config.packet_path = Some(args[i].clone());
                    i += 1;
                }
            }
            "-s" | "--socket-base" => {
                i += 1;
                if i < args.len() {
                    config.socket_base = Some(args[i].clone());
                    i += 1;
                }
            }
            "-o" | "--output-file" => {
                i += 1;
                if i < args.len() {
                    config.output_path = Some(args[i].clone());
                    i += 1;
                }
            }
            "-f" | "--output-form" => {
                i += 1;
                if i < args.len() {
                    config.output_format = parse_output_format(&args[i]);
                    i += 1;
                }
            }
            "--daemon" => {
                config.daemon_flag = true;
                i += 1;
            }
            "--router" => {
                config.router_flag = true;
                i += 1;
            }
            "--socket" => {
                i += 1;
                if i < args.len() {
                    config.unix_socket_path = Some(args[i].clone());
                    i += 1;
                }
            }
            "--port" => {
                i += 1;
                if i < args.len() {
                    config.tcp_port = args[i].parse().ok();
                    i += 1;
                }
            }
            "--http-port" => {
                i += 1;
                if i < args.len() {
                    config.http_port = args[i].parse().ok();
                    i += 1;
                }
            }
            "--fdb" => {
                i += 1;
                if i < args.len() {
                    config.fdb_path = Some(args[i].clone());
                    i += 1;
                }
            }
            "--eval-timeout" => {
                i += 1;
                if i < args.len() {
                    config.eval_timeout = args[i].parse().unwrap_or(30);
                    i += 1;
                }
            }
            _ => {
                // Handle --key=value forms
                if let Some(val) = arg.strip_prefix("--socket=") {
                    config.unix_socket_path = Some(val.to_string());
                    i += 1;
                } else if let Some(val) = arg.strip_prefix("--port=") {
                    config.tcp_port = val.parse().ok();
                    i += 1;
                } else if let Some(val) = arg.strip_prefix("--http-port=") {
                    config.http_port = val.parse().ok();
                    i += 1;
                } else if let Some(val) = arg.strip_prefix("--fdb=") {
                    config.fdb_path = Some(val.to_string());
                    i += 1;
                } else if let Some(val) = arg.strip_prefix("--eval-timeout=") {
                    config.eval_timeout = val.parse().unwrap_or(30);
                    i += 1;
                } else {
                    // Not a nexus option - stop parsing
                    break;
                }
            }
        }
    }
    i
}

/// Extract daemon/server long options from argv in single-command mode.
/// Removes matched options from the args vector.
pub fn extract_global_options(args: &mut Vec<String>, config: &mut NexusConfig) {
    let mut i = 1;
    while i < args.len() {
        if args[i] == "--" {
            break;
        }
        let mut matched = false;
        let mut consumed = 1;
        match args[i].as_str() {
            "--daemon" => {
                config.daemon_flag = true;
                matched = true;
            }
            "--socket" if i + 1 < args.len() => {
                config.unix_socket_path = Some(args[i + 1].clone());
                consumed = 2;
                matched = true;
            }
            "--port" if i + 1 < args.len() => {
                config.tcp_port = args[i + 1].parse().ok();
                consumed = 2;
                matched = true;
            }
            "--http-port" if i + 1 < args.len() => {
                config.http_port = args[i + 1].parse().ok();
                consumed = 2;
                matched = true;
            }
            "--fdb" if i + 1 < args.len() => {
                config.fdb_path = Some(args[i + 1].clone());
                consumed = 2;
                matched = true;
            }
            "--eval-timeout" if i + 1 < args.len() => {
                config.eval_timeout = args[i + 1].parse().unwrap_or(30);
                consumed = 2;
                matched = true;
            }
            _ => {
                // Check --key=value forms
                if let Some(val) = args[i].strip_prefix("--socket=") {
                    config.unix_socket_path = Some(val.to_string());
                    matched = true;
                } else if let Some(val) = args[i].strip_prefix("--port=") {
                    config.tcp_port = val.parse().ok();
                    matched = true;
                } else if let Some(val) = args[i].strip_prefix("--http-port=") {
                    config.http_port = val.parse().ok();
                    matched = true;
                } else if let Some(val) = args[i].strip_prefix("--fdb=") {
                    config.fdb_path = Some(val.to_string());
                    matched = true;
                } else if let Some(val) = args[i].strip_prefix("--eval-timeout=") {
                    config.eval_timeout = val.parse().unwrap_or(30);
                    matched = true;
                }
            }
        }
        if matched {
            for _ in 0..consumed {
                args.remove(i);
            }
        } else {
            i += 1;
        }
    }
}

/// Parse the `-f`/`--output-form` value; exits on an unknown format.
fn parse_output_format(s: &str) -> OutputFormat {
    match s {
        "json" => OutputFormat::Json,
        "mpk" => OutputFormat::MessagePack,
        "voidstar" => OutputFormat::VoidStar,
        "packet" => OutputFormat::Packet,
        _ => {
            eprintln!("Invalid output format: {}", s);
            std::process::exit(1);
        }
    }
}

/// Wrap a string in JSON quotes (for literal string arguments).
a string in JSON quotes (for literal string arguments). pub fn quoted(s: &str) -> String { // JSON-escape the string let escaped = serde_json::to_string(s).unwrap_or_else(|_| format!("\"{}\"", s)); escaped } /// Main dispatch entry point. Routes to the correct command based on argv. pub fn dispatch( args: &[String], arg_start: usize, _shm_basename: &str, config: &NexusConfig, manifest: &Manifest, sockets: &mut [PoolSocket], prog_name: &str, ) { if arg_start >= args.len() { help::print_usage(prog_name, manifest); } let cmd_name = &args[arg_start]; let next = arg_start + 1; // Check if it matches a group name for grp in &manifest.groups { if grp.name == *cmd_name { if next >= args.len() { help::print_group_usage(prog_name, manifest, cmd_name); } let subcmd = &args[next]; if subcmd == "-h" || subcmd == "--help" { help::print_group_usage(prog_name, manifest, cmd_name); } // Find command within this group for cmd in &manifest.commands { if cmd.group.as_deref() == Some(cmd_name.as_str()) && cmd.name == *subcmd { dispatch_command(args, next + 1, config, manifest, cmd, sockets, prog_name); return; } } eprintln!("Unrecognized command '{}' in group '{}'", subcmd, cmd_name); process::clean_exit(1); } } // Try ungrouped commands for cmd in &manifest.commands { if cmd.name == *cmd_name && cmd.group.is_none() { dispatch_command(args, next, config, manifest, cmd, sockets, prog_name); return; } } eprintln!("Unrecognized command '{}'", cmd_name); process::clean_exit(1); } /// Dispatch a single command: parse its args, start needed daemons, execute. 
pub fn dispatch_command( args: &[String], arg_start: usize, config: &NexusConfig, manifest: &Manifest, cmd: &Command, sockets: &mut [PoolSocket], prog_name: &str, ) { let single_cmd = manifest.commands.len() == 1 && manifest.groups.is_empty(); // Parse command-specific arguments let (parsed_args, _remaining_start) = parse_command_args(args, arg_start, cmd, config, single_cmd, prog_name); // Start daemons for remote commands if !cmd.is_pure() { if let Err(e) = process::start_daemons(sockets, &cmd.needed_pools) { eprintln!("Error: {}", e); process::clean_exit(1); } } // Execute the command if cmd.is_pure() { run_pure_command(cmd, &parsed_args, config); } else { run_remote_command(cmd, &parsed_args, sockets, config); } } /// Parsed CLI argument value for a manifest arg slot. #[derive(Debug)] pub enum ArgValue { /// A value string (already quoted if needed). Value(String), /// Null/absent value. Null, /// Group argument with per-entry values. Group { grp_val: Option, fields: Vec>, defaults: Vec>, }, } /// Parse command-specific arguments from argv. 
fn parse_command_args( args: &[String], pos: usize, cmd: &Command, _config: &NexusConfig, single_cmd: bool, prog_name: &str, ) -> (Vec, usize) { let mut parsed = Vec::with_capacity(cmd.args.len()); // Simple option tracking: collect all --opt=val and -o val let mut opt_values: std::collections::HashMap = std::collections::HashMap::new(); let mut flag_values: std::collections::HashMap = std::collections::HashMap::new(); let mut positional_idx = 0; let mut positionals: Vec = Vec::new(); // First pass: separate options from positionals let mut i = pos; while i < args.len() { let arg = &args[i]; if arg == "--" { i += 1; // Everything after -- is positional while i < args.len() { positionals.push(args[i].clone()); i += 1; } break; } if arg == "-h" || arg == "--help" { if single_cmd { help::print_command_help_single(prog_name, cmd); } else { help::print_command_help(prog_name, cmd); } } if arg.starts_with("--") && arg.len() > 2 { // Long option if let Some(eq_pos) = arg.find('=') { let key = &arg[2..eq_pos]; let val = &arg[eq_pos + 1..]; opt_values.insert(key.to_string(), val.to_string()); i += 1; } else { let key = &arg[2..]; // Check if it's a flag if is_flag_opt(cmd, key) { flag_values.insert(key.to_string(), flag_forward_value(cmd, key)); i += 1; } else if is_rev_flag(cmd, key) { if let Some(orig) = find_flag_by_rev(cmd, key) { flag_values.insert(orig, flag_reverse_value_by_rev(cmd, key)); } i += 1; } else if i + 1 < args.len() { opt_values.insert(key.to_string(), args[i + 1].clone()); i += 2; } else { eprintln!("Error: option --{} requires a value", key); process::clean_exit(1); } } } else if arg.starts_with('-') && arg.len() == 2 && arg.as_bytes()[1].is_ascii_alphabetic() { let ch = arg.chars().nth(1).unwrap(); if is_short_flag(cmd, ch) { flag_values.insert( short_to_long(cmd, ch).unwrap_or_else(|| ch.to_string()), flag_forward_value_by_short(cmd, ch), ); i += 1; } else if i + 1 < args.len() { opt_values.insert( short_to_long(cmd, ch).unwrap_or_else(|| 
ch.to_string()), args[i + 1].clone(), ); i += 2; } else { eprintln!("Error: option -{} requires a value", ch); process::clean_exit(1); } } else { positionals.push(arg.clone()); i += 1; } } // Second pass: build ArgValue for each manifest arg for arg_def in &cmd.args { match arg_def { Arg::Positional { quoted, .. } => { if positional_idx < positionals.len() { let val = if *quoted { self::quoted(&positionals[positional_idx]) } else { positionals[positional_idx].clone() }; parsed.push(ArgValue::Value(val)); positional_idx += 1; } else { eprintln!("Error: too few positional arguments"); process::clean_exit(1); } } Arg::Optional { long_opt, short_opt, default_val, quoted, .. } => { let key = long_opt .as_deref() .or_else(|| short_opt.as_deref()) .unwrap_or(""); let user_val = opt_values.get(key); if let Some(val) = user_val { let v = if *quoted { self::quoted(val) } else { val.clone() }; parsed.push(ArgValue::Value(v)); } else if let Some(def) = default_val { parsed.push(ArgValue::Value(def.clone())); } else { parsed.push(ArgValue::Null); } } Arg::Flag { long_opt, default_val, .. } => { let key = long_opt.as_deref().unwrap_or(""); if let Some(val) = flag_values.get(key) { parsed.push(ArgValue::Value(val.clone())); } else { parsed.push(ArgValue::Value( default_val.as_deref().unwrap_or("false").to_string(), )); } } Arg::Group { entries, group_opt, .. 
} => { let grp_val = group_opt.as_ref().and_then(|go| { go.long_opt .as_deref() .and_then(|k| opt_values.get(k)) .cloned() }); let mut fields = Vec::new(); let mut defaults = Vec::new(); for entry in entries { // Look up by long option name or short option character let long_key = entry.arg.long_opt_str().unwrap_or(""); let short_key = entry.arg.short_opt_char() .map(|c| c.to_string()) .unwrap_or_default(); let user = opt_values .get(long_key) .or_else(|| opt_values.get(&short_key)) .or_else(|| flag_values.get(long_key)) .or_else(|| flag_values.get(&short_key)) .map(|v| { if entry.arg.is_quoted() { self::quoted(v) } else { v.clone() } }); fields.push(user); defaults.push(entry.arg.default_val().map(|s| s.to_string())); } parsed.push(ArgValue::Group { grp_val, fields, defaults, }); } } } if positional_idx < positionals.len() { eprintln!("Error: too many positional arguments given"); process::clean_exit(1); } (parsed, i) } // -- Command execution ------------------------------------------------------ /// Execute a remote command by sending a call packet to the pool. 
fn run_remote_command( cmd: &Command, args: &[ArgValue], sockets: &[PoolSocket], config: &NexusConfig, ) { use morloc_runtime::packet; use morloc_runtime::schema::{parse_schema, SerialType}; use std::io::{Read, Write}; use std::os::unix::net::UnixStream; // C library functions from libmorloc.so extern "C" { fn parse_cli_data_argument( dest: *mut u8, arg: *const std::ffi::c_void, schema: *const morloc_runtime::cschema::CSchema, errmsg: *mut *mut std::ffi::c_char, ) -> *mut u8; fn initialize_positional(value: *mut std::ffi::c_char) -> *mut std::ffi::c_void; fn free_argument_t(arg: *mut std::ffi::c_void); fn morloc_packet_size(packet: *const u8, errmsg: *mut *mut std::ffi::c_char) -> usize; fn make_morloc_local_call_packet( midx: u32, arg_packets: *const *const u8, nargs: usize, errmsg: *mut *mut std::ffi::c_char, ) -> *mut u8; fn get_morloc_data_packet_value( data: *const u8, schema: *const morloc_runtime::cschema::CSchema, errmsg: *mut *mut std::ffi::c_char, ) -> *mut u8; } let socket = &sockets[cmd.pool_index]; // Parse return schema let return_schema = match parse_schema(&cmd.ret.schema) { Ok(s) => s, Err(e) => { eprintln!("Error: failed to parse return schema '{}': {}", cmd.ret.schema, e); process::clean_exit(1); } }; // The parsed `args` list and `cmd.args` are index-aligned 1:1 in // declaration order: parse_command_args pushes one ArgValue for // EVERY arg (including flags). The Haskell compiler emits one // schema per arg position too. Walk both lists in lockstep; for // flags, schema_str() returns None and the flag's ArgValue is // already a ready-to-send "true"/"false" string that doesn't need // packet conversion -- but the original v1 dispatch path still // ran flags through parse_cli_data_argument with the flag's bool // schema, so we mirror that to keep the wire format consistent. 
let mut arg_packets: Vec> = Vec::new(); for (i, (arg_val, arg_def)) in args.iter().zip(cmd.args.iter()).enumerate() { let schema_str = arg_def.schema_str().unwrap_or("b"); let schema = match parse_schema(schema_str) { Ok(s) => s, Err(e) => { eprintln!("Error: failed to parse arg schema #{}: {}", i, e); process::clean_exit(1); } }; let c_schema = morloc_runtime::cschema::CSchema::from_rust(&schema); let mut errmsg: *mut std::ffi::c_char = std::ptr::null_mut(); let c_arg; match arg_val { ArgValue::Group { grp_val, fields, defaults } => { // Group arg: use initialize_unrolled (matches C nexus behavior) extern "C" { fn initialize_unrolled( size: usize, default_value: *mut std::ffi::c_char, fields: *mut *mut std::ffi::c_char, default_fields: *mut *mut std::ffi::c_char, ) -> *mut std::ffi::c_void; } let n = fields.len(); let grp_val_c = grp_val.as_ref() .map(|s| std::ffi::CString::new(s.as_str()).unwrap().into_raw()) .unwrap_or(std::ptr::null_mut()); let mut c_fields: Vec<*mut std::ffi::c_char> = fields.iter() .map(|f| f.as_ref() .map(|s| std::ffi::CString::new(s.as_str()).unwrap().into_raw()) .unwrap_or(std::ptr::null_mut())) .collect(); let mut c_defaults: Vec<*mut std::ffi::c_char> = defaults.iter() .map(|d| d.as_ref() .map(|s| std::ffi::CString::new(s.as_str()).unwrap().into_raw()) .unwrap_or(std::ptr::null_mut())) .collect(); c_arg = unsafe { initialize_unrolled(n, grp_val_c, c_fields.as_mut_ptr(), c_defaults.as_mut_ptr()) }; } _ => { let json_str = match arg_val { ArgValue::Value(s) => s.clone(), ArgValue::Null => "null".to_string(), _ => unreachable!(), }; let json_c = std::ffi::CString::new(json_str.as_str()).unwrap(); c_arg = unsafe { initialize_positional(json_c.into_raw()) }; } } let c_pkt = unsafe { parse_cli_data_argument(std::ptr::null_mut(), c_arg, c_schema, &mut errmsg) }; unsafe { free_argument_t(c_arg) }; unsafe { morloc_runtime::cschema::CSchema::free(c_schema) }; if c_pkt.is_null() { let msg = if !errmsg.is_null() { let s = unsafe { 
std::ffi::CStr::from_ptr(errmsg) }.to_string_lossy().into_owned(); unsafe { libc::free(errmsg as *mut std::ffi::c_void) }; s } else { "unknown error".into() }; eprintln!("Error: failed to parse argument #{}: {}", i, msg); process::clean_exit(1); } // Get packet size and copy to Vec let pkt_size = unsafe { morloc_packet_size(c_pkt, &mut errmsg) }; let data_pkt = unsafe { std::slice::from_raw_parts(c_pkt, pkt_size).to_vec() }; unsafe { libc::free(c_pkt as *mut std::ffi::c_void) }; arg_packets.push(data_pkt); } // Build call packet via C library let arg_ptrs: Vec<*const u8> = arg_packets.iter().map(|p| p.as_ptr()).collect(); let mut errmsg_call: *mut std::ffi::c_char = std::ptr::null_mut(); let c_call = unsafe { make_morloc_local_call_packet(cmd.mid, arg_ptrs.as_ptr(), arg_packets.len(), &mut errmsg_call) }; if c_call.is_null() { eprintln!("Error: failed to create call packet"); process::clean_exit(1); } // Get call packet size let call_size = unsafe { let mut e: *mut std::ffi::c_char = std::ptr::null_mut(); morloc_packet_size(c_call, &mut e) }; let call_packet = unsafe { std::slice::from_raw_parts(c_call, call_size).to_vec() }; unsafe { libc::free(c_call as *mut std::ffi::c_void) }; // Send to pool and receive response let mut stream = match UnixStream::connect(&socket.socket_path) { Ok(s) => s, Err(e) => { die_with_pool_error( socket, cmd.pool_index, &format!("failed to connect to pool '{}'", socket.lang), &e, ); } }; if let Err(e) = stream.write_all(&call_packet) { die_with_pool_error( socket, cmd.pool_index, &format!("failed to send call packet to pool '{}'", socket.lang), &e, ); } // Read response header let mut resp_header_bytes = [0u8; 32]; if let Err(e) = stream.read_exact(&mut resp_header_bytes) { die_with_pool_error( socket, cmd.pool_index, &format!("failed to read response header from pool '{}'", socket.lang), &e, ); } let resp_header = match packet::PacketHeader::from_bytes(&resp_header_bytes) { Ok(h) => h, Err(e) => { eprintln!("Error: invalid response 
packet: {}", e); process::clean_exit(1); } }; // Read full response (metadata + payload) let offset = { resp_header.offset } as usize; let length = { resp_header.length } as usize; let remaining = offset + length; let mut resp_body = vec![0u8; remaining]; if remaining > 0 { if let Err(e) = stream.read_exact(&mut resp_body) { die_with_pool_error( socket, cmd.pool_index, &format!("failed to read response body from pool '{}'", socket.lang), &e, ); } } // Reconstruct full packet (header + body) let mut full_packet = Vec::with_capacity(32 + remaining); full_packet.extend_from_slice(&resp_header_bytes); full_packet.extend_from_slice(&resp_body); // Check for error match packet::get_error_message(&full_packet) { Ok(Some(err_msg)) => { eprintln!("Error: run failed\n{}", err_msg); process::clean_exit(1); } Ok(None) => {} Err(e) => { eprintln!("Error: failed to parse response: {}", e); process::clean_exit(1); } } // Extract and print via C library for correct voidstar handling let c_schema = morloc_runtime::cschema::CSchema::from_rust(&return_schema); let mut errmsg: *mut std::ffi::c_char = std::ptr::null_mut(); let result_ptr = unsafe { get_morloc_data_packet_value(full_packet.as_ptr(), c_schema, &mut errmsg) }; if result_ptr.is_null() { let msg = if !errmsg.is_null() { let s = unsafe { std::ffi::CStr::from_ptr(errmsg) }.to_string_lossy().into_owned(); unsafe { libc::free(errmsg as *mut std::ffi::c_void) }; s } else { "unknown error".into() }; eprintln!("Error: failed to extract result: {}", msg); unsafe { morloc_runtime::cschema::CSchema::free(c_schema) }; process::clean_exit(1); } // Check if response is Arrow format let is_arrow = resp_header.is_data() && unsafe { resp_header.command.data.format } == packet::PACKET_FORMAT_ARROW; // Print using the C library for correct output. // Suppress "null" for Unit-returning commands (CLI convention). 
if return_schema.serial_type != SerialType::Nil { print_result_c(result_ptr, c_schema, &full_packet, is_arrow, config); } unsafe { morloc_runtime::cschema::CSchema::free(c_schema) }; } /// Print using the C library functions for correct voidstar handling. fn print_result_c( ptr: *mut u8, schema: *const morloc_runtime::cschema::CSchema, full_packet: &[u8], is_arrow: bool, config: &NexusConfig, ) { extern "C" { fn print_voidstar( voidstar: *const std::ffi::c_void, schema: *const morloc_runtime::cschema::CSchema, errmsg: *mut *mut std::ffi::c_char, ) -> bool; fn pretty_print_voidstar( voidstar: *const std::ffi::c_void, schema: *const morloc_runtime::cschema::CSchema, errmsg: *mut *mut std::ffi::c_char, ) -> bool; fn print_arrow_as_json( data: *const std::ffi::c_void, errmsg: *mut *mut std::ffi::c_char, ) -> bool; fn print_arrow_as_table( data: *const std::ffi::c_void, errmsg: *mut *mut std::ffi::c_char, ) -> bool; fn pack_with_schema( mlc: *const std::ffi::c_void, schema: *const morloc_runtime::cschema::CSchema, mpkptr: *mut *mut std::ffi::c_char, mpk_size: *mut usize, errmsg: *mut *mut std::ffi::c_char, ) -> i32; } let mut errmsg: *mut std::ffi::c_char = std::ptr::null_mut(); match config.output_format { OutputFormat::Json => { let ok = unsafe { if is_arrow && config.print_flag { print_arrow_as_table(ptr as *const std::ffi::c_void, &mut errmsg) } else if is_arrow { print_arrow_as_json(ptr as *const std::ffi::c_void, &mut errmsg) } else if config.print_flag { pretty_print_voidstar(ptr as *const std::ffi::c_void, schema, &mut errmsg) } else { print_voidstar(ptr as *const std::ffi::c_void, schema, &mut errmsg) } }; if !ok { let msg = if !errmsg.is_null() { let s = unsafe { std::ffi::CStr::from_ptr(errmsg) }.to_string_lossy().into_owned(); unsafe { libc::free(errmsg as *mut std::ffi::c_void) }; s } else { "unknown error".into() }; eprintln!("Error: {}", msg); process::clean_exit(1); } } OutputFormat::MessagePack => { let mut mpk_ptr: *mut std::ffi::c_char = 
std::ptr::null_mut(); let mut mpk_size: usize = 0; let rc = unsafe { pack_with_schema( ptr as *const std::ffi::c_void, schema, &mut mpk_ptr, &mut mpk_size, &mut errmsg, ) }; if rc != 0 { eprintln!("Error: msgpack serialization failed"); process::clean_exit(1); } if config.print_flag { let bytes = unsafe { std::slice::from_raw_parts(mpk_ptr as *const u8, mpk_size) }; for (i, b) in bytes.iter().enumerate() { if i > 0 && i % 16 == 0 { println!(); } print!("{:02x} ", b); } println!(); } else { use std::io::Write; let bytes = unsafe { std::slice::from_raw_parts(mpk_ptr as *const u8, mpk_size) }; let _ = std::io::stdout().lock().write_all(bytes); } if !mpk_ptr.is_null() { unsafe { libc::free(mpk_ptr as *mut std::ffi::c_void) }; } } OutputFormat::VoidStar => { extern "C" { fn print_morloc_data_packet( packet: *const u8, schema: *const morloc_runtime::cschema::CSchema, errmsg: *mut *mut std::ffi::c_char, ) -> i32; } if config.print_flag { // Hex dump for (i, b) in full_packet.iter().enumerate() { if i > 0 && i % 4 == 0 { if i % 24 == 0 { println!(); } else { print!(" "); } } print!("{:02X}", b); } if !full_packet.is_empty() { println!(); } } else { let mut errmsg2: *mut std::ffi::c_char = std::ptr::null_mut(); unsafe { print_morloc_data_packet(full_packet.as_ptr(), schema, &mut errmsg2) }; } } OutputFormat::Packet => { // Packet format: write raw binary packet to stdout (used by SLURM) use std::io::Write; let _ = std::io::stdout().lock().write_all(&full_packet); } } process::clean_exit(0); } /// Print using Rust-native functions (kept for reference, currently unused). 
#[allow(dead_code)] fn print_result( ptr: morloc_runtime::shm::AbsPtr, schema: &morloc_runtime::Schema, config: &NexusConfig, ) { use morloc_runtime::{json, mpack}; match config.output_format { OutputFormat::Json => { if config.print_flag { if let Err(e) = json::pretty_print_voidstar(ptr, schema) { eprintln!("Error: {}", e); process::clean_exit(1); } } else { if let Err(e) = json::print_voidstar(ptr, schema) { eprintln!("Error: {}", e); process::clean_exit(1); } } } OutputFormat::MessagePack => { let mpk = match mpack::pack_with_schema(ptr, schema) { Ok(m) => m, Err(e) => { eprintln!("Error: {}", e); process::clean_exit(1); } }; if config.print_flag { // Hex dump for human-readable msgpack for (i, byte) in mpk.iter().enumerate() { if i > 0 && i % 16 == 0 { println!(); } print!("{:02x} ", byte); } println!(); } else { use std::io::Write; let stdout = std::io::stdout(); let mut handle = stdout.lock(); let _ = handle.write_all(&mpk); } } OutputFormat::VoidStar | OutputFormat::Packet => { eprintln!("Error: voidstar/packet output not supported in Rust-native print path"); process::clean_exit(1); } } process::clean_exit(0); } /// Execute a pure command by evaluating the expression via C library. 
fn run_pure_command(cmd: &Command, args: &[ArgValue], config: &NexusConfig) { use morloc_runtime::schema::{parse_schema, SerialType}; extern "C" { fn build_manifest_expr( json_str: *const std::ffi::c_char, errmsg: *mut *mut std::ffi::c_char, ) -> *mut std::ffi::c_void; // morloc_expression_t* fn morloc_eval( expr: *mut std::ffi::c_void, return_schema: *const morloc_runtime::cschema::CSchema, arg_voidstar: *const *mut u8, arg_schemas: *const *const morloc_runtime::cschema::CSchema, nargs: usize, errmsg: *mut *mut std::ffi::c_char, ) -> *mut std::ffi::c_void; // absptr_t fn parse_cli_data_argument( dest: *mut u8, arg: *const std::ffi::c_void, schema: *const morloc_runtime::cschema::CSchema, errmsg: *mut *mut std::ffi::c_char, ) -> *mut u8; fn initialize_positional(value: *mut std::ffi::c_char) -> *mut std::ffi::c_void; fn free_argument_t(arg: *mut std::ffi::c_void); fn get_morloc_data_packet_value( data: *const u8, schema: *const morloc_runtime::cschema::CSchema, errmsg: *mut *mut std::ffi::c_char, ) -> *mut u8; fn make_standard_data_packet( relptr: isize, schema: *const morloc_runtime::cschema::CSchema, ) -> *mut u8; fn abs2rel(ptr: *mut std::ffi::c_void, errmsg: *mut *mut std::ffi::c_char) -> isize; } // Build expression tree from manifest JSON let expr_json = match &cmd.expr { Some(v) => serde_json::to_string(v).unwrap_or_default(), None => { eprintln!("Error: pure command '{}' has no expression", cmd.name); process::clean_exit(1); } }; let expr_c = std::ffi::CString::new(expr_json.as_str()).unwrap(); let mut errmsg: *mut std::ffi::c_char = std::ptr::null_mut(); let expr = unsafe { build_manifest_expr(expr_c.as_ptr(), &mut errmsg) }; if expr.is_null() { let msg = unsafe_errmsg_to_string(errmsg); eprintln!("Error: failed to build expression: {}", msg); process::clean_exit(1); } // Parse return schema let return_schema = match parse_schema(&cmd.ret.schema) { Ok(s) => s, Err(e) => { eprintln!("Error: failed to parse return schema '{}': {}", cmd.ret.schema, e); 
process::clean_exit(1); } }; let c_return_schema = morloc_runtime::cschema::CSchema::from_rust(&return_schema); // The parsed `args` list and `cmd.args` are index-aligned 1:1 in // declaration order: parse_command_args pushes one ArgValue for // EVERY arg (including flags). The Haskell compiler emits one // schema per arg position too. Walk both lists in lockstep; for // flags, the schema_str() accessor returns None and we fall back // to the bool schema "b" so the wire format stays consistent. let mut c_arg_schemas: Vec<*const morloc_runtime::cschema::CSchema> = Vec::new(); let mut c_arg_voidstars: Vec<*mut u8> = Vec::new(); for (i, (arg_val, arg_def)) in args.iter().zip(cmd.args.iter()).enumerate() { let schema_str = arg_def.schema_str().unwrap_or("b"); let schema = match parse_schema(schema_str) { Ok(s) => s, Err(e) => { eprintln!("Error: failed to parse arg schema #{}: {}", i, e); process::clean_exit(1); } }; let c_schema = morloc_runtime::cschema::CSchema::from_rust(&schema); let json_str = match arg_val { ArgValue::Value(s) => s.clone(), ArgValue::Null => "null".to_string(), ArgValue::Group { .. 
} => "null".to_string(), }; // Parse CLI arg to data packet, then extract voidstar let json_c = std::ffi::CString::new(json_str.as_str()).unwrap(); let c_arg = unsafe { initialize_positional(json_c.into_raw()) }; let c_pkt = unsafe { parse_cli_data_argument(std::ptr::null_mut(), c_arg, c_schema, &mut errmsg) }; unsafe { free_argument_t(c_arg) }; if c_pkt.is_null() { let msg = unsafe_errmsg_to_string(errmsg); eprintln!("Error: failed to parse argument #{}: {}", i, msg); process::clean_exit(1); } let voidstar = unsafe { get_morloc_data_packet_value(c_pkt, c_schema, &mut errmsg) }; unsafe { libc::free(c_pkt as *mut std::ffi::c_void) }; if voidstar.is_null() { let msg = unsafe_errmsg_to_string(errmsg); eprintln!("Error: failed to extract argument #{}: {}", i, msg); process::clean_exit(1); } c_arg_schemas.push(c_schema); c_arg_voidstars.push(voidstar); } // Call morloc_eval let result = unsafe { morloc_eval( expr, c_return_schema, c_arg_voidstars.as_ptr(), c_arg_schemas.as_ptr(), c_arg_voidstars.len(), &mut errmsg, ) }; if result.is_null() { let msg = unsafe_errmsg_to_string(errmsg); eprintln!("Error: evaluation failed: {}", msg); process::clean_exit(1); } // Convert result to relptr and make a data packet for printing let result_relptr = unsafe { abs2rel(result, &mut errmsg) }; let result_packet = unsafe { make_standard_data_packet(result_relptr, c_return_schema) }; if result_packet.is_null() { eprintln!("Error: failed to create result packet"); process::clean_exit(1); } // Get packet as bytes for print_result_c extern "C" { fn morloc_packet_size(packet: *const u8, errmsg: *mut *mut std::ffi::c_char) -> usize; } let pkt_size = unsafe { morloc_packet_size(result_packet, &mut errmsg) }; let pkt_bytes = unsafe { std::slice::from_raw_parts(result_packet, pkt_size).to_vec() }; // Extract voidstar value from the result packet let result_ptr = unsafe { get_morloc_data_packet_value(pkt_bytes.as_ptr(), c_return_schema, &mut errmsg) }; if return_schema.serial_type != 
SerialType::Nil { print_result_c(result_ptr, c_return_schema, &pkt_bytes, false, config); } // Cleanup for cs in &c_arg_schemas { unsafe { morloc_runtime::cschema::CSchema::free(*cs as *mut morloc_runtime::cschema::CSchema) }; } unsafe { morloc_runtime::cschema::CSchema::free(c_return_schema); libc::free(result_packet as *mut std::ffi::c_void); } } fn unsafe_errmsg_to_string(errmsg: *mut std::ffi::c_char) -> String { if errmsg.is_null() { "unknown error".into() } else { let s = unsafe { std::ffi::CStr::from_ptr(errmsg) }.to_string_lossy().into_owned(); unsafe { libc::free(errmsg as *mut std::ffi::c_void) }; s } } // -- Helpers for command argument parsing ------------------------------------ fn is_flag_opt(cmd: &Command, long_name: &str) -> bool { cmd.args.iter().any(|a| match a { Arg::Flag { long_opt, .. } => long_opt.as_deref() == Some(long_name), Arg::Group { entries, .. } => entries.iter().any(|e| match &e.arg { Arg::Flag { long_opt, .. } => long_opt.as_deref() == Some(long_name), _ => false, }), _ => false, }) } fn is_rev_flag(cmd: &Command, name: &str) -> bool { cmd.args.iter().any(|a| match a { Arg::Flag { long_rev, .. } => long_rev.as_deref() == Some(name), Arg::Group { entries, .. } => entries.iter().any(|e| match &e.arg { Arg::Flag { long_rev, .. } => long_rev.as_deref() == Some(name), _ => false, }), _ => false, }) } fn find_flag_by_rev(cmd: &Command, rev_name: &str) -> Option { for a in &cmd.args { match a { Arg::Flag { long_opt, long_rev, .. } => { if long_rev.as_deref() == Some(rev_name) { return long_opt.clone(); } } Arg::Group { entries, .. } => { for e in entries { if let Arg::Flag { long_opt, long_rev, .. } = &e.arg { if long_rev.as_deref() == Some(rev_name) { return long_opt.clone(); } } } } _ => {} } } None } fn flag_forward_value(cmd: &Command, long_name: &str) -> String { for a in &cmd.args { if let Arg::Flag { long_opt, default_val, .. 
} = a {
            if long_opt.as_deref() == Some(long_name) {
                let def = default_val.as_deref().unwrap_or("false");
                // Giving the flag toggles its default value.
                return if def == "true" { "false".into() } else { "true".into() };
            }
        }
    }
    "true".into()
}

/// Same toggle-the-default logic as `flag_forward_value`, keyed by the
/// flag's short option character.
fn flag_forward_value_by_short(cmd: &Command, ch: char) -> String {
    for a in &cmd.args {
        if let Arg::Flag { short_opt, default_val, .. } = a {
            if short_opt.as_deref().and_then(|s| s.chars().next()) == Some(ch) {
                let def = default_val.as_deref().unwrap_or("false");
                return if def == "true" { "false".into() } else { "true".into() };
            }
        }
    }
    "true".into()
}

/// Value stored when a reverse (negating) flag is given: the flag's default.
fn flag_reverse_value_by_rev(cmd: &Command, rev_name: &str) -> String {
    // Search top-level and group entries.
    // NOTE(review): the closure's `Option<String>` type parameters were
    // stripped in the extracted source; restored from the surrounding usage.
    let check = |long_rev: &Option<String>, default_val: &Option<String>| -> Option<String> {
        if long_rev.as_deref() == Some(rev_name) {
            let def = default_val.as_deref().unwrap_or("false");
            Some(if def == "true" { "true".into() } else { "false".into() })
        } else {
            None
        }
    };
    for a in &cmd.args {
        match a {
            Arg::Flag { long_rev, default_val, .. } => {
                if let Some(v) = check(long_rev, default_val) {
                    return v;
                }
            }
            Arg::Group { entries, .. } => {
                for e in entries {
                    if let Arg::Flag { long_rev, default_val, .. } = &e.arg {
                        if let Some(v) = check(long_rev, default_val) {
                            return v;
                        }
                    }
                }
            }
            _ => {}
        }
    }
    "false".into()
}

/// True when `ch` is the short option of a top-level flag.
/// NOTE(review): unlike `is_flag_opt`, this does NOT search group entries —
/// confirm whether that asymmetry is intentional.
fn is_short_flag(cmd: &Command, ch: char) -> bool {
    cmd.args.iter().any(|a| match a {
        Arg::Flag { short_opt, .. } => {
            short_opt.as_deref().and_then(|s| s.chars().next()) == Some(ch)
        }
        _ => false,
    })
}

/// Map a short option character to its long option name; `None` when no
/// arg uses `ch`, or when the matching arg has no long name.
/// NOTE(review): the `Option<String>` return type was stripped in the
/// extracted source; restored from the `long_opt.clone()` values returned.
fn short_to_long(cmd: &Command, ch: char) -> Option<String> {
    for a in &cmd.args {
        let (s, l) = match a {
            Arg::Optional { short_opt, long_opt, .. } => (short_opt.as_deref(), long_opt.clone()),
            Arg::Flag { short_opt, long_opt, .. } => (short_opt.as_deref(), long_opt.clone()),
            Arg::Group { entries, .. } => {
                // Search inside group entries; fall back to the short char
                // itself when the entry has no long name.
                for entry in entries {
                    let (es, el) = match &entry.arg {
                        Arg::Optional { short_opt, long_opt, .. } => {
                            (short_opt.as_deref(), long_opt.clone())
                        }
                        Arg::Flag { short_opt, long_opt, ..
 } => (short_opt.as_deref(), long_opt.clone()),
                        _ => (None, None),
                    };
                    if es.and_then(|s| s.chars().next()) == Some(ch) {
                        return el.or_else(|| Some(ch.to_string()));
                    }
                }
                (None, None)
            }
            _ => (None, None),
        };
        if s.and_then(|s| s.chars().next()) == Some(ch) {
            return l;
        }
    }
    None
}


================================================ FILE: data/rust/morloc-nexus/src/help.rs ================================================
//! Help text generation matching the C nexus output format.

use crate::manifest::{Arg, Command, GroupEntry, Manifest};

/// Print nexus-level usage (no manifest loaded). Never returns.
pub fn print_nexus_usage(prog_name: &str) -> ! {
    eprintln!("Usage: {} [OPTION...] COMMAND [ARG...]", prog_name);
    eprintln!();
    eprintln!("morloc-nexus is the morloc program dispatcher.");
    eprintln!();
    eprintln!("Arguments:");
    // NOTE(review): a metavar (e.g. a bracketed placeholder) appears to have
    // been stripped from the extracted string below — confirm upstream.
    eprintln!(" Path to a .manifest file or wrapper script");
    eprintln!();
    eprintln!("Nexus options:");
    eprintln!(" -h, --help Print this help message");
    eprintln!(" -p, --print Pretty-print output for human consumption");
    eprintln!(" -o, --output-file Print to this file instead of STDOUT");
    eprintln!(" -f, --output-format Output format [json|mpk|voidstar]");
    eprintln!();
    eprintln!("Daemon mode:");
    eprintln!(" --daemon Run as a long-lived daemon");
    eprintln!(" --http-port PORT Listen on HTTP port");
    eprintln!(" --port PORT Listen on TCP port");
    eprintln!(" --socket PATH Listen on Unix socket");
    eprintln!(" --eval-timeout SECS Timeout for /eval requests (default: 30)");
    eprintln!();
    eprintln!("Router mode:");
    eprintln!(" --router Run as a multi-program router");
    eprintln!(" --fdb Path to fdb manifest directory");
    std::process::exit(0);
}

/// Print usage for a multi-command program.
pub fn print_usage(prog_name: &str, manifest: &Manifest) -> ! {
    eprintln!("Usage: {} [OPTION...] 
COMMAND [ARG...]", prog_name);
    // Module-level description
    if !manifest.desc.is_empty() {
        eprintln!();
        for line in &manifest.desc {
            eprintln!("{}", line);
        }
    }
    eprintln!();
    eprintln!("Nexus options:");
    eprintln!(" -h, --help Print this help message");
    eprintln!(" -p, --print Pretty-print output for human consumption");
    eprintln!(" -o, --output-file Print to this file instead of STDOUT");
    eprintln!(" -f, --output-format Output format [json|mpk|voidstar]");
    eprintln!();
    eprintln!("Daemon mode:");
    eprintln!(" --daemon Run as a long-lived daemon");
    eprintln!(" --http-port PORT Listen on HTTP port");
    eprintln!(" --port PORT Listen on TCP port");
    eprintln!(" --socket PATH Listen on Unix socket");
    eprintln!();
    // Ungrouped commands, aligned on the longest command name.
    let ungrouped: Vec<&Command> = manifest
        .commands
        .iter()
        .filter(|c| c.group.is_none())
        .collect();
    if !ungrouped.is_empty() {
        eprintln!("Commands (call with -h/--help for more info):");
        let longest = ungrouped.iter().map(|c| c.name.len()).max().unwrap_or(0);
        for cmd in &ungrouped {
            eprint!(" {}", cmd.name);
            if let Some(first) = cmd.desc.first() {
                // Pad so the first description line lines up across commands.
                let pad = longest - cmd.name.len() + 2;
                eprint!("{:pad$}{}", "", first, pad = pad);
            }
            eprintln!();
        }
    }
    if !manifest.groups.is_empty() {
        if !ungrouped.is_empty() {
            eprintln!();
        }
        eprintln!("Command groups (call with -h/--help for more info):");
        let longest = manifest.groups.iter().map(|g| g.name.len()).max().unwrap_or(0);
        for grp in &manifest.groups {
            eprint!(" {}", grp.name);
            if let Some(first) = grp.desc.first() {
                let pad = longest - grp.name.len() + 2;
                eprint!("{:pad$}{}", "", first, pad = pad);
            }
            eprintln!();
        }
    }
    // Epilogues
    for epilogue in &manifest.epilogues {
        eprintln!();
        for line in epilogue {
            eprintln!("{}", line);
        }
    }
    std::process::exit(0);
}

/// Print usage for a command group.
pub fn print_group_usage(prog_name: &str, manifest: &Manifest, group_name: &str) -> ! {
    // The group's description, when present, follows the usage line.
    let grp = manifest.groups.iter().find(|g| g.name == group_name);
    eprintln!("Usage: {} {} COMMAND [ARG...]", prog_name, group_name);
    if let Some(g) = grp {
        if !g.desc.is_empty() {
            eprintln!();
            for line in &g.desc {
                eprintln!("{}", line);
            }
        }
    }
    eprintln!("\nCommands:");
    // Only the commands belonging to this group are listed.
    let cmds: Vec<&Command> = manifest
        .commands
        .iter()
        .filter(|c| c.group.as_deref() == Some(group_name))
        .collect();
    let longest = cmds.iter().map(|c| c.name.len()).max().unwrap_or(0);
    for cmd in &cmds {
        eprint!(" {}", cmd.name);
        if let Some(first) = cmd.desc.first() {
            let pad = longest - cmd.name.len() + 2;
            eprint!("{:pad$}{}", "", first, pad = pad);
        }
        eprintln!();
    }
    std::process::exit(0);
}

/// Print help for a specific subcommand.
pub fn print_command_help(prog_name: &str, cmd: &Command) -> ! {
    // Usage line
    if let Some(ref group) = cmd.group {
        eprint!("Usage: {} {} {}", prog_name, group, cmd.name);
    } else {
        eprint!("Usage: {} {}", prog_name, cmd.name);
    }
    print_usage_suffix(cmd);
    eprintln!();
    if !cmd.desc.is_empty() {
        eprintln!();
    }
    print_command_body(cmd);
    std::process::exit(0);
}

/// Print help for a single-command program.
pub fn print_command_help_single(prog_name: &str, cmd: &Command) -> !
{
    eprint!("Usage: {}", prog_name);
    print_usage_suffix(cmd);
    eprintln!();
    // Description (skip a leading empty line in the description block)
    if !cmd.desc.is_empty() {
        eprintln!();
        for (i, line) in cmd.desc.iter().enumerate() {
            if i == 0 && line.is_empty() {
                continue;
            }
            eprintln!("{}", line);
        }
    }
    // Nexus options
    eprintln!("\nNexus options:");
    eprintln!(" --print Pretty-print output for human consumption");
    eprintln!(" --output-file Print to this file instead of STDOUT");
    // FIX(review): was "--output-form" — a typo; every other help printer
    // (e.g. print_usage) spells this option "--output-format".
    eprintln!(" --output-format Output format [json|mpk|voidstar]");
    eprintln!("\nDaemon mode:");
    eprintln!(" --daemon Run as a long-lived daemon");
    eprintln!(" --http-port PORT Listen on HTTP port");
    eprintln!(" --port PORT Listen on TCP port");
    eprintln!(" --socket PATH Listen on UNIX socket");
    print_args_body(cmd);
    print_type_definitions(cmd);
    print_return_info(cmd);
    std::process::exit(0);
}

// -- Helpers ----------------------------------------------------------------

/// Append the "[OPTION...]" marker and positional metavars to a usage line.
fn print_usage_suffix(cmd: &Command) {
    let has_opts = cmd.args.iter().any(|a| !matches!(a, Arg::Positional { .. }));
    if has_opts {
        eprint!(" [OPTION...]");
    }
    for arg in &cmd.args {
        if let Arg::Positional { metavar, .. } = arg {
            eprint!(" {}", metavar.as_deref().unwrap_or("ARG"));
        }
    }
}

/// Shared body for the grouped/ungrouped command help printers.
fn print_command_body(cmd: &Command) {
    // Description (skip a leading empty line in the description block)
    if !cmd.desc.is_empty() {
        for (i, line) in cmd.desc.iter().enumerate() {
            if i == 0 && line.is_empty() {
                continue;
            }
            eprintln!("{}", line);
        }
    }
    print_args_body(cmd);
    print_type_definitions(cmd);
    print_return_info(cmd);
}

/// Render the positional / optional / group argument sections.
fn print_args_body(cmd: &Command) {
    // Positional arguments
    let has_pos = cmd.args.iter().any(|a| matches!(a, Arg::Positional { .. }));
    if has_pos {
        eprintln!("\nPositional arguments:");
        for arg in &cmd.args {
            if let Arg::Positional { metavar, type_desc, desc, ..
} = arg {
                eprint!(" {}", metavar.as_deref().unwrap_or("ARG"));
                if let Some(first) = desc.first() {
                    eprint!(" {}", first);
                }
                eprintln!();
                if let Some(td) = type_desc {
                    eprintln!(" type: {}", td);
                }
            }
        }
    }
    // Optional arguments (opts and flags)
    let has_opt = cmd
        .args
        .iter()
        .any(|a| matches!(a, Arg::Optional { .. } | Arg::Flag { .. }));
    if has_opt {
        eprintln!("\nOptional arguments:");
        for arg in &cmd.args {
            print_opt_or_flag(arg);
        }
    }
    // Group arguments
    for arg in &cmd.args {
        if let Arg::Group {
            metavar,
            desc,
            group_opt,
            entries,
            ..
        } = arg
        {
            eprintln!("\nGroup arguments:");
            eprint!(" {}", metavar.as_deref().unwrap_or(""));
            if let Some(first) = desc.first() {
                eprint!(": {}", first);
            }
            eprintln!();
            // The whole-group option (record given as a file or JSON string).
            if let Some(go) = group_opt {
                eprint!(" ");
                if let Some(ref s) = go.short_opt {
                    eprint!("-{}, ", s);
                }
                if let Some(ref l) = go.long_opt {
                    eprint!("--{} {}", l, metavar.as_deref().unwrap_or(""));
                }
                eprintln!();
                eprintln!(" provide record as file or JSON string");
            }
            for entry in entries {
                print_group_entry(entry);
            }
        }
    }
}

// Render one optional argument or flag line (with default/desc/type notes).
fn print_opt_or_flag(arg: &Arg) {
    match arg {
        Arg::Optional {
            short_opt,
            long_opt,
            metavar,
            default_val,
            desc,
            type_desc,
            ..
        } => {
            eprint!(" ");
            // Emit whichever of -s/--long forms are declared.
            match (short_opt.as_deref(), long_opt.as_deref()) {
                (Some(s), Some(l)) => eprint!(
                    "-{}, --{} {}",
                    s,
                    l,
                    metavar.as_deref().unwrap_or("")
                ),
                (Some(s), None) => {
                    eprint!("-{} {}", s, metavar.as_deref().unwrap_or(""))
                }
                (None, Some(l)) => eprint!(
                    "--{} {}",
                    l,
                    metavar.as_deref().unwrap_or("")
                ),
                _ => {}
            }
            eprintln!();
            if let Some(d) = default_val {
                eprintln!(" default: {}", d);
            }
            for d in desc {
                eprintln!(" {}", d);
            }
            if let Some(td) = type_desc {
                eprintln!(" type: {}", td);
            }
        }
        Arg::Flag {
            short_opt,
            long_opt,
            long_rev,
            default_val,
            desc,
            ..
        } => {
            eprint!(" ");
            match (short_opt.as_deref(), long_opt.as_deref()) {
                (Some(s), Some(l)) => eprint!("-{}, --{}", s, l),
                (Some(s), None) => eprint!("-{}", s),
                (None, Some(l)) => eprint!("--{}", l),
                _ => {}
            }
            eprintln!();
            // Reverse (negating) form, when declared.
            if let Some(rev) = long_rev {
                eprintln!(" --{}", rev);
            }
            if let Some(d) = default_val {
                eprintln!(" default: {}", d);
            }
            for d in desc {
                eprintln!(" {}", d);
            }
        }
        _ => {}
    }
}

// Render one entry of a group argument (an option or flag nested in a group).
fn print_group_entry(entry: &GroupEntry) {
    let ea = &entry.arg;
    eprint!(" ");
    match ea {
        Arg::Optional {
            short_opt,
            long_opt,
            metavar,
            default_val,
            desc,
            ..
        } => {
            match (short_opt.as_deref(), long_opt.as_deref()) {
                (Some(s), Some(l)) => {
                    eprint!("-{}, --{}", s, l);
                    if let Some(m) = metavar {
                        eprint!(" {}", m);
                    }
                }
                (Some(s), None) => {
                    eprint!("-{}", s);
                    if let Some(m) = metavar {
                        eprint!(" {}", m);
                    }
                }
                (None, Some(l)) => {
                    eprint!("--{}", l);
                    if let Some(m) = metavar {
                        eprint!(" {}", m);
                    }
                }
                _ => {}
            }
            eprintln!();
            if let Some(d) = default_val {
                eprintln!(" default: {}", d);
            }
            for d in desc {
                eprintln!(" {}", d);
            }
        }
        Arg::Flag {
            short_opt,
            long_opt,
            default_val,
            desc,
            ..
        } => {
            match (short_opt.as_deref(), long_opt.as_deref()) {
                (Some(s), Some(l)) => eprint!("-{}, --{}", s, l),
                (Some(s), None) => eprint!("-{}", s),
                (None, Some(l)) => eprint!("--{}", l),
                _ => {}
            }
            eprintln!();
            if let Some(d) = default_val {
                eprintln!(" default: {}", d);
            }
            for d in desc {
                eprintln!(" {}", d);
            }
        }
        _ => {}
    }
}

// Render the "Return:" section from the command's return metadata.
fn print_return_info(cmd: &Command) {
    eprintln!("\nReturn: {}", cmd.ret.type_desc);
    for line in &cmd.ret.desc {
        eprintln!(" {}", line);
    }
}

// -- Schema-walking renderer for the Record / Table Schemas sections ---------
//
// In v2 the manifest no longer carries a parallel `type_definitions` list.
// The same information is reconstructed at help-render time by walking // each command's args + return value: for every typed entry whose schema // parses to a Map at the top level, we treat the entry's `type` name as // the named-type label and its schema's keys + parameter schemas as the // field list. The record-vs-table distinction comes from the entry's // `kind` constraint. /// A rendered named-type layout for the help output, sourced from a /// parsed schema. struct TypeLayout<'a> { name: &'a str, /// "record" | "object" | "table" -- comes from the `kind` constraint. kind: &'a str, /// (field_name, rendered_type) fields: Vec<(String, String)>, } /// Pretty-render a parsed `Schema` as a morloc-flavored type string, /// suitable for the field-type column in the schemas block. fn render_schema_type(s: &morloc_runtime::schema::Schema) -> String { use morloc_runtime::schema::SerialType::*; match s.serial_type { Nil => "()".into(), Bool => "Bool".into(), Sint8 => "Int8".into(), Sint16 => "Int16".into(), Sint32 => "Int".into(), Sint64 => "Int64".into(), Uint8 => "UInt8".into(), Uint16 => "UInt16".into(), Uint32 => "UInt32".into(), Uint64 => "UInt64".into(), Float32 => "Float32".into(), Float64 => "Real".into(), String => "Str".into(), Array => format!( "[{}]", s.parameters .first() .map(render_schema_type) .unwrap_or_else(|| "?".into()) ), Tuple => { // `String` here is fully qualified because the surrounding // match brings `SerialType::String` into scope as a variant, // shadowing the std `String` type. let inner: Vec = s.parameters.iter().map(render_schema_type).collect(); format!("({})", inner.join(", ")) } Map => { // A nested record-ish thing. Use the hint string when present // (which carries the language-specific concrete type name); // otherwise show an inline placeholder. Either way, the // nested record will be listed separately in the same // schema block if its name appears as another arg's type. 
s.hint.clone().unwrap_or_else(|| "{..}".into()) } Optional => format!( "?{}", s.parameters .first() .map(render_schema_type) .unwrap_or_else(|| "?".into()) ), Tensor => format!( "Tensor<{}>", s.parameters .first() .map(render_schema_type) .unwrap_or_else(|| "?".into()) ), } } /// Try to extract a `TypeLayout` from a (name, schema_string, kind) /// triple. Returns None if any input is missing or the schema does not /// parse to a top-level Map. Tables (whose fields are arrays in the wire /// schema) render their fields by the array's element type, mirroring /// how the user wrote them in the source. fn extract_named_layout<'a>( type_name: Option<&'a str>, schema_str: Option<&str>, kind: Option<&'a str>, ) -> Option> { use morloc_runtime::schema::SerialType; let name = type_name?; let schema = schema_str?; let kind = kind?; let parsed = morloc_runtime::schema::parse_schema(schema).ok()?; if parsed.serial_type != SerialType::Map { return None; } // For a table, every field's wire schema is an Array -- peel one layer // off so the user sees `name :: Str` instead of `name :: [Str]`. let strip_array = kind == "table"; let fields = parsed .keys .iter() .zip(parsed.parameters.iter()) .map(|(k, p)| { let inner = if strip_array && p.serial_type == SerialType::Array { p.parameters.first().unwrap_or(p) } else { p }; (k.clone(), render_schema_type(inner)) }) .collect(); Some(TypeLayout { name, kind, fields }) } /// Walk every arg + the return of a command. For each typed entry, try /// to build a layout. Deduplicate by type name, preserving discovery /// order so the rendering matches the order types appear in the /// signature. fn collect_command_layouts<'a>(cmd: &'a Command) -> Vec> { use std::collections::HashSet; let mut seen: HashSet<&str> = HashSet::new(); let mut out: Vec> = Vec::new(); for arg in &cmd.args { // Skip unrolled groups without a group_opt: each field already // appears as its own flag in the usage, so the schema is redundant. 
// Keep the schema when group_opt is present (the user can pass the // entire record as JSON and needs the full field spec). if let Arg::Group { group_opt: None, .. } = arg { continue; } if let Some(layout) = extract_named_layout(arg.type_desc_str(), arg.schema_str(), arg.kind_constraint()) { if seen.insert(layout.name) { out.push(layout); } } } let ret_kind = cmd .ret .constraints .iter() .find(|c| c.ctype == "kind") .and_then(|c| c.value.as_ref().and_then(|v| v.as_str())); if let Some(layout) = extract_named_layout(Some(&cmd.ret.type_desc), Some(&cmd.ret.schema), ret_kind) { if seen.insert(layout.name) { out.push(layout); } } out } /// Print the Record Schemas / Table Schemas sections for any named /// types referenced in this command's signature. The whole block is /// skipped when there are none. fn print_type_definitions(cmd: &Command) { let layouts = collect_command_layouts(cmd); if layouts.is_empty() { return; } let records: Vec<&TypeLayout> = layouts.iter().filter(|l| l.kind != "table").collect(); let tables: Vec<&TypeLayout> = layouts.iter().filter(|l| l.kind == "table").collect(); if !records.is_empty() { eprintln!("\nRecord Schemas:"); print_layouts(&records); } if !tables.is_empty() { eprintln!("\nTable Schemas:"); print_layouts(&tables); } } /// Render a list of layouts. Each layout shows its type name on its own /// line followed by the field list with `::`-aligned column widths. /// Definitions are separated by blank lines. fn print_layouts(defs: &[&TypeLayout]) { for (i, def) in defs.iter().enumerate() { if i > 0 { eprintln!(); } eprintln!(" {}", def.name); let name_width = def .fields .iter() .map(|(k, _)| k.len()) .max() .unwrap_or(0); for (k, v) in &def.fields { eprintln!(" {:width$} :: {}", k, v, width = name_width); } } } ================================================ FILE: data/rust/morloc-nexus/src/main.rs ================================================ //! Morloc Nexus: CLI dispatcher for multi-language pool orchestration. //! //! 
Replaces data/nexus.c. Entry point for all morloc programs. //! Reads a .manifest JSON, spawns language pool daemons, and routes //! function calls to them over Unix sockets. mod dispatch; mod help; mod manifest; mod process; use dispatch::NexusConfig; /// Resolve the morloc data directory: MORLOC_HOME if set, else ~/.local/share/morloc. fn morloc_home() -> String { std::env::var("MORLOC_HOME").unwrap_or_else(|_| { format!( "{}/.local/share/morloc", std::env::var("HOME").unwrap_or_else(|_| "/root".into()) ) }) } fn main() { let args: Vec = std::env::args().collect(); let mut config = NexusConfig::default(); // First pass: parse nexus-level options let opt_end = dispatch::parse_nexus_options(&args, &mut config); // Handle --router mode (no manifest needed) if config.router_flag { run_router(&config); std::process::exit(0); } // If -h with no manifest argument, show nexus help let prog_name = args.first().map(|s| s.as_str()).unwrap_or("morloc-nexus"); if config.help_flag && opt_end >= args.len() { help::print_nexus_usage(prog_name); } // Manifest path: either an explicit argument or derived from argv[0]. // In daemon mode (`./test --daemon`), the manifest is at `.manifest`. // In normal mode (`./test add 1 2`), argv[0] is also the manifest source. // An explicit path argument is only needed for multi-command mode. 
let manifest_path = if opt_end < args.len() { args[opt_end].clone() } else if config.daemon_flag || config.router_flag { // Daemon/router: derive from argv[0] args[0].clone() } else { help::print_nexus_usage(prog_name) }; let prog_name = std::path::Path::new(&manifest_path) .file_name() .and_then(|n| n.to_str()) .unwrap_or(&manifest_path) .to_string(); let mut arg_cursor = if opt_end < args.len() { opt_end + 1 } else { args.len() }; // Read and parse manifest let payload = match manifest::read_manifest_payload(&manifest_path) { Ok(p) => p, Err(e) => { eprintln!("Failed to load manifest '{}': {}", manifest_path, e); std::process::exit(1); } }; let manifest = match manifest::parse_manifest(&payload) { Ok(m) => m, Err(e) => { eprintln!("Failed to parse manifest '{}': {}", manifest_path, e); std::process::exit(1); } }; let single_command = manifest.commands.len() == 1 && manifest.groups.is_empty(); // Second pass: parse options after manifest path (skip in single-command mode) let mut remaining_args = args.clone(); if !single_command { arg_cursor = dispatch::parse_nexus_options(&args[opt_end..], &mut config) + opt_end; } else { // In single-command mode, extract daemon/server long options manually dispatch::extract_global_options(&mut remaining_args, &mut config); } // Pool paths in the manifest are absolute, so no chdir is needed. // This lets user programs resolve file paths relative to the caller's CWD. // Source imports in pools resolve via __file__-relative paths (Python sys.path) // or script-relative paths (R .morloc.source) rather than depending on CWD. 
// Validate pool executables exist if let Err(e) = process::validate_pools(&manifest.pools) { eprintln!("Error: {}", e); std::process::exit(1); } // Handle help flag with manifest loaded if config.help_flag { if single_command { help::print_command_help_single(&prog_name, &manifest.commands[0]); } else { help::print_usage(&prog_name, &manifest); } } // Setup tmpdir and SHM let tmpdir = match process::make_tmpdir() { Ok(t) => t, Err(e) => { eprintln!("Error: {}", e); std::process::exit(1); } }; process::set_tmpdir(tmpdir.clone()); let job_hash = process::make_job_hash(42); let shm_basename = format!("morloc-{}", job_hash); // Initialize shared memory via libmorloc.so using dlsym. // CRITICAL: We must use dlsym to call the CDYLIB's shinit, not the rlib's. // The rlib and cdylib have separate static globals (VOLUMES, ALLOC_MUTEX, etc.). // All SHM operations in pool-facing C code go through the cdylib's globals. // If we call the rlib's shinit, the cdylib's globals stay uninitialized. { let _lib = unsafe { libc::dlopen(std::ptr::null(), libc::RTLD_NOW) }; // RTLD_DEFAULT (NULL handle) searches in order: executable, then loaded libs // But the rlib symbols come first. Use RTLD_NEXT-style lookup via the .so path. 
let lib_path = std::ffi::CString::new( format!("{}/lib/libmorloc.so", morloc_home()) ).unwrap(); let lib = unsafe { libc::dlopen(lib_path.as_ptr(), libc::RTLD_NOW | libc::RTLD_GLOBAL) }; if lib.is_null() { let err = unsafe { libc::dlerror() }; let err_msg = if err.is_null() { "unknown error".to_string() } else { unsafe { std::ffi::CStr::from_ptr(err) }.to_string_lossy().into_owned() }; eprintln!("Error: failed to load libmorloc.so: {}", err_msg); process::clean_exit(1); } type ShmSetFallbackFn = unsafe extern "C" fn(*const std::ffi::c_char); type ShinitFn = unsafe extern "C" fn(*const std::ffi::c_char, usize, usize, *mut *mut std::ffi::c_char) -> *mut std::ffi::c_void; let set_fb_sym = std::ffi::CString::new("shm_set_fallback_dir").unwrap(); let shinit_sym = std::ffi::CString::new("shinit").unwrap(); let set_fb: ShmSetFallbackFn = unsafe { std::mem::transmute(libc::dlsym(lib, set_fb_sym.as_ptr())) }; let do_shinit: ShinitFn = unsafe { std::mem::transmute(libc::dlsym(lib, shinit_sym.as_ptr())) }; let tmpdir_c = std::ffi::CString::new(tmpdir.as_str()).unwrap(); let basename_c = std::ffi::CString::new(shm_basename.as_str()).unwrap(); let mut errmsg: *mut std::ffi::c_char = std::ptr::null_mut(); unsafe { set_fb(tmpdir_c.as_ptr()); let shm = do_shinit(basename_c.as_ptr(), 0, 0xffff, &mut errmsg); if shm.is_null() { let msg = if !errmsg.is_null() { let s = std::ffi::CStr::from_ptr(errmsg).to_string_lossy().into_owned(); libc::free(errmsg as *mut std::ffi::c_void); s } else { "unknown error".into() }; eprintln!("Error: failed to initialize shared memory: {}", msg); process::clean_exit(1); } } unsafe { libc::dlclose(lib) }; } // Become subreaper for orphaned grandchildren process::set_child_subreaper(); // Install signal handlers process::install_signal_handlers(); // Setup sockets let mut sockets = process::setup_sockets(&manifest.pools, &tmpdir, &shm_basename); // Daemon mode if config.daemon_flag { let all_indices: Vec = (0..manifest.pools.len()).collect(); if let 
Err(e) = process::start_daemons(&mut sockets, &all_indices) { eprintln!("Error: {}", e); process::clean_exit(1); } // Build DaemonConfig and call daemon_run in libmorloc.so run_daemon(&config, &mut sockets, &shm_basename, &payload); process::clean_exit(0); } // Normal CLI mode if config.packet_path.is_none() { if single_command { // Single-command: dispatch directly to the command, no subcommand lookup // Allow optional command name prefix for backward compatibility let mut cmd_arg_start = arg_cursor; if cmd_arg_start < remaining_args.len() && remaining_args[cmd_arg_start] == manifest.commands[0].name { cmd_arg_start += 1; } dispatch::dispatch_command( &remaining_args, cmd_arg_start, &config, &manifest, &manifest.commands[0], &mut sockets, &prog_name, ); } else { if arg_cursor >= remaining_args.len() { help::print_usage(&prog_name, &manifest); } dispatch::dispatch( &remaining_args, arg_cursor, &shm_basename, &config, &manifest, &mut sockets, &prog_name, ); } } else { // Call-packet mode: read a pre-built call packet from file, // send to the appropriate pool, write result as MessagePack. // Used by SLURM workers on remote compute nodes. run_call_packet(&config, &tmpdir); } process::clean_exit(0); } /// Run the daemon event loop by calling daemon_run in libmorloc.so. 
fn run_daemon( config: &dispatch::NexusConfig, sockets: &mut [process::PoolSocket], shm_basename: &str, manifest_payload: &str, ) { use std::ffi::{c_char, c_void, CString}; use std::ptr; // daemon_run and parse_manifest signatures from libmorloc.so extern "C" { fn daemon_run( config: *mut c_void, // *mut DaemonConfig manifest: *mut c_void, // *mut Manifest (opaque) sockets: *mut c_void, // *mut MorlocSocket n_pools: usize, shm_basename: *const c_char, ); fn parse_manifest(text: *const c_char, errmsg: *mut *mut c_char) -> *mut c_void; } // Build C MorlocSocket array (matches daemon_ffi::MorlocSocket layout) #[repr(C)] struct CMorlocSocket { lang: *mut c_char, syscmd: *mut *mut c_char, socket_filename: *mut c_char, pid: i32, } let n_pools = sockets.len(); let mut c_sockets: Vec = Vec::with_capacity(n_pools); // Keep CStrings alive for the duration let mut _keepalive: Vec> = Vec::new(); for sock in sockets.iter() { let lang_c = CString::new(sock.lang.as_str()).unwrap(); let socket_c = CString::new(sock.socket_path.as_str()).unwrap(); // Build NULL-terminated syscmd array let mut cmd_ptrs: Vec<*mut c_char> = Vec::new(); let mut cmd_strs: Vec = Vec::new(); for arg in &sock.syscmd { let c = CString::new(arg.to_bytes()).unwrap(); cmd_ptrs.push(c.as_ptr() as *mut c_char); cmd_strs.push(c); } cmd_ptrs.push(ptr::null_mut()); c_sockets.push(CMorlocSocket { lang: lang_c.as_ptr() as *mut c_char, syscmd: cmd_ptrs.as_ptr() as *mut *mut c_char, socket_filename: socket_c.as_ptr() as *mut c_char, pid: sock.pid, }); // Keep everything alive _keepalive.push(cmd_strs); _keepalive.push(vec![lang_c, socket_c]); } // Build C DaemonConfig (matches daemon_ffi::DaemonConfig layout) #[repr(C)] struct CDaemonConfig { unix_socket_path: *const c_char, tcp_port: i32, http_port: i32, pool_check_fn: *const c_void, // Option as null pool_alive_fn: *const c_void, // Option as null n_pools: usize, eval_timeout: i32, } let unix_socket_cstr = config.unix_socket_path.as_ref() .map(|p| 
CString::new(p.as_str()).unwrap()); let mut daemon_config = CDaemonConfig { unix_socket_path: unix_socket_cstr.as_ref() .map_or(ptr::null(), |c| c.as_ptr()), tcp_port: config.tcp_port.unwrap_or(0), http_port: config.http_port.unwrap_or(0), pool_check_fn: ptr::null(), pool_alive_fn: process::pool_is_alive_ptr(), n_pools, eval_timeout: config.eval_timeout, }; // Parse manifest via the C FFI (so daemon_run gets the C-layout manifest). // The payload was already extracted from the wrapper script by the main flow. let manifest_c_str = CString::new(manifest_payload).unwrap(); let mut errmsg: *mut c_char = ptr::null_mut(); let c_manifest = unsafe { parse_manifest(manifest_c_str.as_ptr(), &mut errmsg) }; if c_manifest.is_null() { let msg = if !errmsg.is_null() { let s = unsafe { std::ffi::CStr::from_ptr(errmsg) }.to_string_lossy().into_owned(); unsafe { libc::free(errmsg as *mut c_void) }; s } else { "unknown error".into() }; eprintln!("Error: failed to parse manifest for daemon: {}", msg); process::clean_exit(1); } let shm_c = CString::new(shm_basename).unwrap(); unsafe { daemon_run( &mut daemon_config as *mut CDaemonConfig as *mut c_void, c_manifest, c_sockets.as_mut_ptr() as *mut c_void, n_pools, shm_c.as_ptr(), ); } } /// Run the multi-program router daemon. /// Scans the fdb directory for .manifest files and serves them all via HTTP/TCP/Unix. 
fn run_router(config: &dispatch::NexusConfig) { use std::ffi::{c_char, c_void, CString}; use std::ptr; extern "C" { fn router_init(fdb_path: *const c_char, errmsg: *mut *mut c_char) -> *mut c_void; fn router_run(config: *mut c_void, router: *mut c_void); fn router_free(router: *mut c_void); } let fdb_path = config.fdb_path.clone().unwrap_or_else(|| { format!("{}/fdb", morloc_home()) }); let fdb_c = CString::new(fdb_path.as_str()).unwrap(); let mut errmsg: *mut c_char = ptr::null_mut(); let router = unsafe { router_init(fdb_c.as_ptr(), &mut errmsg) }; if router.is_null() { let msg = if !errmsg.is_null() { let s = unsafe { std::ffi::CStr::from_ptr(errmsg) }.to_string_lossy().into_owned(); unsafe { libc::free(errmsg as *mut c_void) }; s } else { "unknown error".into() }; eprintln!("Error: failed to initialize router: {}", msg); std::process::exit(1); } // Build DaemonConfig for the router #[repr(C)] struct CDaemonConfig { unix_socket_path: *const c_char, tcp_port: i32, http_port: i32, pool_check_fn: *const c_void, pool_alive_fn: *const c_void, n_pools: usize, eval_timeout: i32, } let unix_cstr = config.unix_socket_path.as_ref() .map(|p| CString::new(p.as_str()).unwrap()); let mut dc = CDaemonConfig { unix_socket_path: unix_cstr.as_ref().map_or(ptr::null(), |c| c.as_ptr()), tcp_port: config.tcp_port.unwrap_or(0), http_port: config.http_port.unwrap_or(0), pool_check_fn: ptr::null(), pool_alive_fn: ptr::null(), n_pools: 0, eval_timeout: if config.eval_timeout > 0 { config.eval_timeout } else { 30 }, }; unsafe { router_run(&mut dc as *mut CDaemonConfig as *mut c_void, router); router_free(router); } } /// Run a pre-built call packet on a remote worker node (SLURM mode). /// Reads a call packet from file, sends it to the pool, writes result as MessagePack. 
fn run_call_packet(config: &dispatch::NexusConfig, tmpdir: &str) {
    use std::ffi::{c_char, c_void, CString};
    use std::ptr;

    // All packet/schema plumbing comes from the C ABI of libmorloc.so.
    extern "C" {
        fn read_binary_file(
            filename: *const c_char,
            file_size: *mut usize,
            errmsg: *mut *mut c_char,
        ) -> *mut u8;
        fn send_and_receive_over_socket(
            socket_path: *const c_char,
            packet: *const u8,
            errmsg: *mut *mut c_char,
        ) -> *mut u8;
        fn get_morloc_data_packet_error_message(
            data: *const u8,
            errmsg: *mut *mut c_char,
        ) -> *mut c_char;
        fn read_schema_from_packet_meta(
            packet: *const u8,
            errmsg: *mut *mut c_char,
        ) -> *mut c_char;
        fn parse_schema(
            schema_str: *const c_char,
            errmsg: *mut *mut c_char,
        ) -> *mut morloc_runtime::cschema::CSchema;
        fn get_morloc_data_packet_value(
            data: *const u8,
            schema: *const morloc_runtime::cschema::CSchema,
            errmsg: *mut *mut c_char,
        ) -> *mut u8;
        fn pack_with_schema(
            mlc: *const c_void,
            schema: *const morloc_runtime::cschema::CSchema,
            mpkptr: *mut *mut c_char,
            mpk_size: *mut usize,
            errmsg: *mut *mut c_char,
        ) -> i32;
        fn write_atomic(
            filename: *const c_char,
            data: *const u8,
            size: usize,
            errmsg: *mut *mut c_char,
        ) -> i32;
        fn print_morloc_data_packet(
            packet: *const u8,
            schema: *const morloc_runtime::cschema::CSchema,
            errmsg: *mut *mut c_char,
        ) -> i32;
    }

    // Caller guarantees packet_path is Some in this mode (main checked it).
    let packet_path = config.packet_path.as_ref().unwrap();
    let socket_base = match &config.socket_base {
        Some(s) => s.clone(),
        None => {
            eprintln!("Error: --socket-base required for call-packet mode");
            process::clean_exit(1);
        }
    };
    let socket_path = format!("{}/{}", tmpdir, socket_base);

    let packet_c = CString::new(packet_path.as_str()).unwrap();
    let socket_c = CString::new(socket_path.as_str()).unwrap();
    let mut errmsg: *mut c_char = ptr::null_mut();

    // Read call packet from file
    let mut packet_size: usize = 0;
    let call_packet = unsafe { read_binary_file(packet_c.as_ptr(), &mut packet_size, &mut errmsg) };
    if call_packet.is_null() || !errmsg.is_null() {
        let msg = if !errmsg.is_null() {
            let s = unsafe { std::ffi::CStr::from_ptr(errmsg) }.to_string_lossy().into_owned();
            unsafe { libc::free(errmsg as *mut c_void) };
            s
        } else {
            "unknown error".into()
        };
        eprintln!("Error: failed to read call packet '{}': {}", packet_path, msg);
        process::clean_exit(1);
    }

    // Send to pool and receive response; the call packet is ours to free.
    let result_packet = unsafe {
        send_and_receive_over_socket(socket_c.as_ptr(), call_packet, &mut errmsg)
    };
    unsafe { libc::free(call_packet as *mut c_void) };
    if result_packet.is_null() || !errmsg.is_null() {
        let msg = if !errmsg.is_null() {
            let s = unsafe { std::ffi::CStr::from_ptr(errmsg) }.to_string_lossy().into_owned();
            unsafe { libc::free(errmsg as *mut c_void) };
            s
        } else {
            "unknown error".into()
        };
        eprintln!("Error: run failed: {}", msg);
        process::clean_exit(1);
    }

    // Check for error in response
    let run_err = unsafe { get_morloc_data_packet_error_message(result_packet, &mut errmsg) };
    if !run_err.is_null() {
        let s = unsafe { std::ffi::CStr::from_ptr(run_err) }.to_string_lossy().into_owned();
        unsafe { libc::free(run_err as *mut c_void) };
        eprintln!("Error: run failed: {}", s);
        process::clean_exit(1);
    }

    // If output-form is "packet", write raw packet to output file
    // NOTE(review): `errmsg` is reused across the calls below without being
    // reset to null between them; the `errmsg.is_null()` guards therefore
    // assume each C call either leaves it null or sets it -- confirm against
    // the libmorloc FFI contract.
    if config.output_format == dispatch::OutputFormat::Packet {
        if let Some(ref output_path) = config.output_path {
            let schema_str = unsafe { read_schema_from_packet_meta(result_packet, &mut errmsg) };
            let schema = if !schema_str.is_null() {
                unsafe { parse_schema(schema_str, &mut errmsg) }
            } else {
                ptr::null_mut()
            };
            unsafe {
                print_morloc_data_packet(result_packet, schema, &mut errmsg);
            };
            // Also write as msgpack file
            if !schema.is_null() {
                let mlc = unsafe { get_morloc_data_packet_value(result_packet, schema, &mut errmsg) };
                if !mlc.is_null() && errmsg.is_null() {
                    let mut mpk_data: *mut c_char = ptr::null_mut();
                    let mut mpk_size: usize = 0;
                    unsafe {
                        pack_with_schema(mlc as *const c_void, schema, &mut mpk_data, &mut mpk_size, &mut errmsg)
                    };
                    if !mpk_data.is_null() && errmsg.is_null() {
                        let mpk_filename = format!("{}.mpk", output_path);
                        let mpk_c = CString::new(mpk_filename.as_str()).unwrap();
                        unsafe {
                            write_atomic(mpk_c.as_ptr(), mpk_data as *const u8, mpk_size, &mut errmsg)
                        };
                        unsafe { libc::free(mpk_data as *mut c_void) };
                    }
                }
            }
        }
    }
    unsafe { libc::free(result_packet as *mut c_void) };
}



================================================
FILE: data/rust/morloc-nexus/src/manifest.rs
================================================
//! Manifest types -- thin re-export shim over the canonical schema
//! definitions in the `morloc-manifest` crate.
//!
//! This module exists only so that existing code in this crate (and
//! its consumers) can keep saying `crate::manifest::Manifest` without
//! caring whether the types live here or in a sibling crate. The
//! actual schema, with full doc comments and parsing logic, lives in
//! `data/rust/morloc-manifest/src/lib.rs`.

pub use morloc_manifest::{
    parse_manifest, read_manifest_payload, Arg, Command, GroupEntry, Manifest, Pool,
};



================================================
FILE: data/rust/morloc-nexus/src/process.rs
================================================
//! Pool daemon process management, signal handling, and lifecycle.
//!
//! Replaces the fork/exec, SIGCHLD, SIGTERM, clean_exit logic from nexus.c.

use std::ffi::CString;
use std::path::Path;
use std::sync::atomic::{AtomicBool, AtomicI32, Ordering};
use std::time::Duration;

use crate::manifest::Pool;

pub const MAX_DAEMONS: usize = 32;
// Ping/backoff tuning used by wait_for_daemon below.
const INITIAL_PING_TIMEOUT: Duration = Duration::from_millis(10);
const INITIAL_RETRY_DELAY: Duration = Duration::from_millis(1);
const RETRY_MULTIPLIER: f64 = 1.25;
const MAX_RETRIES: usize = 16;

// ── Global state for signal handlers ───────────────────────────────────────

/// PIDs of spawned pool daemons. 0 = unused, -1 = reaped.
static PIDS: [AtomicI32; MAX_DAEMONS] = {
    const INIT: AtomicI32 = AtomicI32::new(0);
    [INIT; MAX_DAEMONS]
};

/// Process group IDs for cleanup.
static PGIDS: [AtomicI32; MAX_DAEMONS] = { const INIT: AtomicI32 = AtomicI32::new(0); [INIT; MAX_DAEMONS] }; /// Exit statuses saved by SIGCHLD handler. static EXIT_STATUSES: [AtomicI32; MAX_DAEMONS] = { const INIT: AtomicI32 = AtomicI32::new(0); [INIT; MAX_DAEMONS] }; /// Re-entrancy guard for clean_exit. static CLEANING_UP: AtomicBool = AtomicBool::new(false); /// Global tmpdir path (set once in main, read during cleanup). static TMPDIR: std::sync::OnceLock = std::sync::OnceLock::new(); /// Socket info for each pool. /// /// Pool stderr and stdout are intentionally NOT captured or intercepted by /// the nexus: a core morloc guarantee is that anything a sourced function /// prints to stderr/stdout is passed through unchanged. Raised exceptions /// are caught inside each pool's dispatch wrapper (see pool.py/pool.cpp/ /// pool.R/pool.jl) and returned as morloc error packets, which the nexus /// then annotates with call-site context when bubbling them up. pub struct PoolSocket { pub lang: String, pub socket_path: String, pub syscmd: Vec, pub pid: i32, } // ── Signal handlers (async-signal-safe) ──────────────────────────────────── /// SIGCHLD handler: reap terminated children. extern "C" fn sigchld_handler(_sig: libc::c_int) { #[cfg(target_os = "linux")] let saved_errno = unsafe { *libc::__errno_location() }; #[cfg(target_os = "macos")] let saved_errno = unsafe { *libc::__error() }; loop { let mut status: libc::c_int = 0; let pid = unsafe { libc::waitpid(-1, &mut status, libc::WNOHANG) }; if pid <= 0 { break; } for i in 0..MAX_DAEMONS { if PIDS[i].load(Ordering::Relaxed) == pid { EXIT_STATUSES[i].store(status, Ordering::Relaxed); PIDS[i].store(-1, Ordering::Relaxed); break; } } } #[cfg(target_os = "linux")] unsafe { *libc::__errno_location() = saved_errno }; #[cfg(target_os = "macos")] unsafe { *libc::__error() = saved_errno }; } /// SIGTERM/SIGINT handler: clean shutdown. 
extern "C" fn signal_exit_handler(sig: libc::c_int) { if CLEANING_UP.load(Ordering::Relaxed) { unsafe { libc::_exit(128 + sig) }; } clean_exit(128 + sig); } /// Install signal handlers. pub fn install_signal_handlers() { unsafe { // SIGCHLD let mut sa: libc::sigaction = std::mem::zeroed(); sa.sa_sigaction = sigchld_handler as *const () as usize; libc::sigemptyset(&mut sa.sa_mask); sa.sa_flags = libc::SA_RESTART | libc::SA_NOCLDSTOP; libc::sigaction(libc::SIGCHLD, &sa, std::ptr::null_mut()); // SIGTERM and SIGINT let mut sa_exit: libc::sigaction = std::mem::zeroed(); sa_exit.sa_sigaction = signal_exit_handler as *const () as usize; libc::sigemptyset(&mut sa_exit.sa_mask); sa_exit.sa_flags = 0; libc::sigaction(libc::SIGTERM, &sa_exit, std::ptr::null_mut()); libc::sigaction(libc::SIGINT, &sa_exit, std::ptr::null_mut()); } } /// Set the global tmpdir for cleanup. pub fn set_tmpdir(path: String) { let _ = TMPDIR.set(path); } /// Get the tmpdir path. pub fn get_tmpdir() -> Option<&'static str> { TMPDIR.get().map(|s| s.as_str()) } // ── Clean exit ───────────────────────────────────────────────────────────── /// Terminate all pool daemons and clean up resources. /// /// Race condition with stderr output: when a pool process is dying (e.g., /// Python printing a traceback), its stderr writes may still be in a pipe /// buffer or mid-syscall when we send SIGTERM. The pool's signal handler /// (or SIG_DFL) may kill the process before its output reaches the /// terminal. We mitigate this by: /// 1. Flushing the nexus's own stderr first (so our error message is out) /// 2. Giving pools 200ms after SIGTERM before escalating to SIGKILL /// (up from the previous 50ms, which was too short for Python's /// atexit handlers and multiprocessing cleanup to flush buffers) pub fn clean_exit(exit_code: i32) -> ! { CLEANING_UP.store(true, Ordering::SeqCst); // Flush nexus stderr so our error messages are visible even if // the process is killed by a parent (e.g., shell pipeline). 
unsafe { libc::fsync(2) }; // Block SIGCHLD during cleanup unsafe { let mut block_chld: libc::sigset_t = std::mem::zeroed(); libc::sigemptyset(&mut block_chld); libc::sigaddset(&mut block_chld, libc::SIGCHLD); libc::sigprocmask(libc::SIG_BLOCK, &block_chld, std::ptr::null_mut()); } // Send SIGTERM to all pool process groups for i in 0..MAX_DAEMONS { let pgid = PGIDS[i].load(Ordering::Relaxed); if pgid > 0 { unsafe { libc::kill(-pgid, libc::SIGTERM) }; } } // Wait for groups to exit (up to 200ms per group, then SIGKILL). // The 200ms window serves two purposes: // - Lets pool signal handlers run (Python's signal_handler in pool.py // calls close_daemon and cleans up shared memory) // - Lets any pending stderr writes (tracebacks, error messages) drain // to the terminal before the process is force-killed for i in 0..MAX_DAEMONS { let pgid = PGIDS[i].load(Ordering::Relaxed); if pgid <= 0 { continue; } // Reap any available children while unsafe { libc::waitpid(-1, std::ptr::null_mut(), libc::WNOHANG) } > 0 {} if unsafe { libc::kill(-pgid, 0) } == -1 { continue; } let mut group_dead = false; for _ in 0..100 { while unsafe { libc::waitpid(-1, std::ptr::null_mut(), libc::WNOHANG) } > 0 {} if unsafe { libc::kill(-pgid, 0) } == -1 { group_dead = true; break; } std::thread::sleep(Duration::from_millis(2)); } if !group_dead { unsafe { libc::kill(-pgid, libc::SIGKILL) }; std::thread::sleep(Duration::from_millis(50)); } } // Final reap while unsafe { libc::waitpid(-1, std::ptr::null_mut(), libc::WNOHANG) } > 0 {} // Clean up shared memory segments extern "C" { fn shclose(errmsg: *mut *mut std::ffi::c_char) -> bool; } unsafe { let mut err: *mut std::ffi::c_char = std::ptr::null_mut(); shclose(&mut err); if !err.is_null() { libc::free(err as *mut libc::c_void); } } // Clean up tmpdir if let Some(dir) = get_tmpdir() { let _ = std::fs::remove_dir_all(dir); } std::process::exit(exit_code); } // ── Pool daemon spawning ─────────────────────────────────────────────────── /// Setup 
socket descriptors for all pools from the manifest. pub fn setup_sockets(pools: &[Pool], tmpdir: &str, shm_basename: &str) -> Vec { pools .iter() .map(|pool| { let socket_path = format!("{}/{}", tmpdir, pool.socket); // Build syscmd: exec_args... socket_path tmpdir shm_basename let mut syscmd: Vec = pool .exec .iter() .map(|s| CString::new(s.as_str()).unwrap()) .collect(); syscmd.push(CString::new(socket_path.as_str()).unwrap()); syscmd.push(CString::new(tmpdir).unwrap()); syscmd.push(CString::new(shm_basename).unwrap()); PoolSocket { lang: pool.lang.clone(), socket_path, syscmd, pid: 0, } }) .collect() } /// Fork and exec a language pool daemon. Returns child PID. /// /// The child inherits the nexus's stdin/stdout/stderr unchanged: anything a /// sourced function prints must reach the terminal byte-for-byte without /// morloc interposing. Runtime errors raised inside the pool are caught by /// the pool's own dispatch wrapper and returned as morloc error packets. fn start_language_server(socket: &PoolSocket) -> Result { let pid = unsafe { libc::fork() }; if pid == 0 { // Child process unsafe { libc::setpgid(0, 0) }; let argv: Vec<*const libc::c_char> = socket .syscmd .iter() .map(|s| s.as_ptr()) .chain(std::iter::once(std::ptr::null())) .collect(); unsafe { libc::execvp(argv[0], argv.as_ptr()); } // Only reached if exec fails. eprintln!( "execvp failed for {}: {}", socket.lang, std::io::Error::last_os_error() ); unsafe { libc::_exit(127) }; } else if pid > 0 { // Parent: ensure child is in its own process group unsafe { libc::setpgid(pid, pid) }; Ok(pid) } else { Err(format!("fork failed: {}", std::io::Error::last_os_error())) } } /// Start pool daemons for the given socket indices and wait for them to respond to pings. 
pub fn start_daemons(sockets: &mut [PoolSocket], indices: &[usize]) -> Result<(), String> { for &idx in indices { let pid = start_language_server(&sockets[idx])?; sockets[idx].pid = pid; PIDS[idx].store(pid, Ordering::Relaxed); PGIDS[idx].store(pid, Ordering::Relaxed); } // Wait for each daemon to respond to pings for &idx in indices { wait_for_daemon(&sockets[idx], idx)?; } Ok(()) } /// Ping a daemon with exponential backoff until it responds. /// Matches the C nexus behavior: initial delay 1ms, multiplier 1.25, /// plus socket timeout that doubles from 10ms to ~10s. fn wait_for_daemon(socket: &PoolSocket, pool_index: usize) -> Result<(), String> { use morloc_runtime::packet::PacketHeader; use std::os::unix::net::UnixStream; use std::io::{Read, Write}; let ping = PacketHeader::ping(); let ping_bytes = ping.to_bytes(); let mut retry_delay = INITIAL_RETRY_DELAY.as_secs_f64(); let mut ping_timeout = INITIAL_PING_TIMEOUT; for attempt in 0..=MAX_RETRIES { // Check if child already died. The pool's stderr was inherited // directly, so any traceback it printed is already on the user's // terminal; the nexus just reports the exit status here. 
if PIDS[pool_index].load(Ordering::Relaxed) == -1 { let status = EXIT_STATUSES[pool_index].load(Ordering::Relaxed); return Err(format!( "Pool process for '{}' died unexpectedly (status: {})", socket.lang, status )); } // Try to connect and ping match UnixStream::connect(&socket.socket_path) { Ok(mut stream) => { let _ = stream.set_read_timeout(Some(ping_timeout)); let _ = stream.set_write_timeout(Some(ping_timeout)); if stream.write_all(&ping_bytes).is_ok() { let mut resp = [0u8; 32]; if stream.read_exact(&mut resp).is_ok() { if let Ok(hdr) = PacketHeader::from_bytes(&resp) { if hdr.is_ping() { return Ok(()); } } } } } Err(_) => {} } if attempt == MAX_RETRIES { return Err(format!( "Failed to ping pool '{}' at {} after {} retries", socket.lang, socket.socket_path, MAX_RETRIES )); } // Sleep with exponential backoff // Use the larger of retry_delay or ping_timeout to ensure we wait // long enough for slow-starting pools (R, Python) let wait = retry_delay.max(ping_timeout.as_secs_f64()); let secs = wait as u64; let nanos = ((wait - secs as f64) * 1e9) as u32; std::thread::sleep(Duration::new(secs, nanos)); retry_delay *= RETRY_MULTIPLIER; ping_timeout = ping_timeout * 2; } unreachable!() } /// Return a C-compatible function pointer for pool_is_alive. pub fn pool_is_alive_ptr() -> *const std::ffi::c_void { extern "C" fn pool_alive_c(pool_index: usize) -> bool { pool_is_alive(pool_index) } pool_alive_c as *const std::ffi::c_void } /// Check if a pool at given index is alive. pub fn pool_is_alive(pool_index: usize) -> bool { if pool_index >= MAX_DAEMONS { return false; } let pid = PIDS[pool_index].load(Ordering::Relaxed); if pid <= 0 { return false; } unsafe { libc::kill(pid, 0) == 0 } } /// Get the exit status of a reaped pool, returning signal/exit info. 
pub fn pool_death_info(pool_index: usize) -> Option { if PIDS[pool_index].load(Ordering::Relaxed) != -1 { return None; } let st = EXIT_STATUSES[pool_index].load(Ordering::Relaxed); if libc::WIFSIGNALED(st) { let sig = libc::WTERMSIG(st); Some(format!("Pool process crashed with signal {sig}")) } else if libc::WIFEXITED(st) { let code = libc::WEXITSTATUS(st); Some(format!("Pool process exited with status {code}")) } else { Some("Pool process died unexpectedly".into()) } } /// Validate that all pool executables exist. pub fn validate_pools(pools: &[Pool]) -> Result<(), String> { for pool in pools { if let Some(exec) = pool.exec.last() { if !Path::new(exec).exists() { return Err(format!( "Build artifacts missing or stale. Pool file '{}' not found. Re-run `morloc make`.", exec )); } } } Ok(()) } /// Create a temporary directory for this nexus session. pub fn make_tmpdir() -> Result { let template = CString::new("/tmp/morloc.XXXXXX").unwrap(); let mut buf = template.into_bytes_with_nul(); let ptr = buf.as_mut_ptr() as *mut libc::c_char; let result = unsafe { libc::mkdtemp(ptr) }; if result.is_null() { return Err(format!( "Failed to create temporary directory: {}", std::io::Error::last_os_error() )); } let cstr = unsafe { std::ffi::CStr::from_ptr(result) }; Ok(cstr.to_string_lossy().into_owned()) } /// Generate a job hash from seed, pid, and timestamps. pub fn make_job_hash(seed: u64) -> u64 { use morloc_runtime::hash::xxh64; let pid = std::process::id() as u64; let now = std::time::SystemTime::now() .duration_since(std::time::UNIX_EPOCH) .unwrap_or_default(); let epoch_ns = now.as_nanos() as u64; let data = format!("{}:{}:{}", pid, epoch_ns, seed); xxh64(data.as_bytes()) } /// Become a subreaper so orphaned grandchildren get reparented to us. /// Only available on Linux; no-op on other platforms. 
pub fn set_child_subreaper() { #[cfg(target_os = "linux")] unsafe { libc::prctl(libc::PR_SET_CHILD_SUBREAPER, 1, 0, 0, 0); } } ================================================ FILE: data/rust/morloc-runtime/Cargo.toml ================================================ [package] name = "morloc-runtime" version = "0.81.0" edition = "2021" description = "Morloc runtime library: shared memory, serialization, IPC, packet protocol" # Version is intentionally synchronized with the morloc compiler version # (see ../../../package.yaml). The C-FFI manifest reader rejects # manifests whose recorded morloc_version differs from this crate's # CARGO_PKG_VERSION at parse time. Bumping the morloc compiler version # requires bumping this version in lockstep. [lib] crate-type = ["cdylib", "staticlib", "rlib"] [dependencies] morloc-manifest = { path = "../morloc-manifest" } libc = { workspace = true } serde = { workspace = true } serde_json = { workspace = true } rmp = "0.8" rmp-serde = { workspace = true } twox-hash = { workspace = true } nix = { workspace = true } thiserror = { workspace = true } [build-dependencies] cbindgen = "0.28" # cc crate no longer needed -- all C files ported to Rust ================================================ FILE: data/rust/morloc-runtime/build.rs ================================================ fn main() { let target = std::env::var("TARGET").unwrap_or_default(); println!("cargo:rustc-link-lib=pthread"); if target.contains("linux") { println!("cargo:rustc-link-lib=rt"); } // The morloc compiler version is sourced from CARGO_PKG_VERSION // (this crate's Cargo.toml), which is intentionally kept in // lockstep with the morloc Haskell package.yaml. 
} ================================================ FILE: data/rust/morloc-runtime/cbindgen.toml ================================================ language = "C" header = "/* Generated by cbindgen - do not edit manually */" autogen_warning = "" include_version = false documentation_style = "c99" no_includes = true [export] prefix = "" [fn] prefix = "" [parse] parse_deps = false ================================================ FILE: data/rust/morloc-runtime/src/arrow_ffi.rs ================================================ //! Arrow C Data Interface implementation. //! Replaces arrow.c. Provides SHM ↔ Arrow conversion. use std::ffi::{c_char, c_void}; use std::ptr; use crate::cschema::CSchema; use crate::error::{clear_errmsg, set_errmsg, MorlocError}; use crate::shm::{self, RelPtr}; const ARROW_SHM_MAGIC: u32 = 0xA770DA7A; const ARROW_BUFFER_ALIGN: usize = 64; fn arrow_align_up(x: usize) -> usize { (x + ARROW_BUFFER_ALIGN - 1) & !(ARROW_BUFFER_ALIGN - 1) } // ── Arrow C Data Interface structs (matching Apache spec) ──────────────────── #[repr(C)] pub struct ArrowSchema { pub format: *const c_char, pub name: *const c_char, pub metadata: *const c_char, pub flags: i64, pub n_children: i64, pub children: *mut *mut ArrowSchema, pub dictionary: *mut ArrowSchema, pub release: Option, pub private_data: *mut c_void, } #[repr(C)] pub struct ArrowArray { pub length: i64, pub null_count: i64, pub offset: i64, pub n_buffers: i64, pub n_children: i64, pub buffers: *mut *const c_void, pub children: *mut *mut ArrowArray, pub dictionary: *mut ArrowArray, pub release: Option, pub private_data: *mut c_void, } // ── SHM header types ───────────────────────────────────────────────────────── #[repr(C)] pub struct ArrowColumnDesc { pub col_type: u32, // morloc_serial_type pub length: u64, pub null_count: u64, pub name_offset: u32, pub name_length: u16, pub data_offset: u64, pub data_size: u64, } #[repr(C)] pub struct ArrowShmHeader { pub magic: u32, pub n_columns: u32, pub n_rows: u64, pub 
total_size: u64,
}

// ── Type mapping ─────────────────────────────────────────────────────────────

// Serial type constants matching C enum
const MORLOC_NIL: u32 = 0;
const MORLOC_BOOL: u32 = 1;
const MORLOC_SINT8: u32 = 2;
const MORLOC_SINT16: u32 = 3;
const MORLOC_SINT32: u32 = 4;
const MORLOC_SINT64: u32 = 5;
const MORLOC_UINT8: u32 = 6;
const MORLOC_UINT16: u32 = 7;
const MORLOC_UINT32: u32 = 8;
const MORLOC_UINT64: u32 = 9;
const MORLOC_FLOAT32: u32 = 10;
const MORLOC_FLOAT64: u32 = 11;
const MORLOC_STRING: u32 = 12;

/// Byte width of one element of a fixed-width serial type; 0 for
/// unsupported or variable-width types.
#[no_mangle]
pub extern "C" fn arrow_element_size(serial_type: u32) -> usize {
    match serial_type {
        MORLOC_BOOL | MORLOC_SINT8 | MORLOC_UINT8 => 1,
        MORLOC_SINT16 | MORLOC_UINT16 => 2,
        MORLOC_SINT32 | MORLOC_UINT32 | MORLOC_FLOAT32 => 4,
        MORLOC_SINT64 | MORLOC_UINT64 | MORLOC_FLOAT64 => 8,
        _ => 0,
    }
}

/// Arrow format string for a serial type; NULL for unsupported types.
/// Returned pointers are 'static NUL-terminated literals.
#[no_mangle]
pub extern "C" fn arrow_format_string(serial_type: u32) -> *const c_char {
    match serial_type {
        MORLOC_BOOL => b"b\0".as_ptr() as *const c_char,
        MORLOC_SINT8 => b"c\0".as_ptr() as *const c_char,
        MORLOC_UINT8 => b"C\0".as_ptr() as *const c_char,
        MORLOC_SINT16 => b"s\0".as_ptr() as *const c_char,
        MORLOC_UINT16 => b"S\0".as_ptr() as *const c_char,
        MORLOC_SINT32 => b"i\0".as_ptr() as *const c_char,
        MORLOC_UINT32 => b"I\0".as_ptr() as *const c_char,
        MORLOC_SINT64 => b"l\0".as_ptr() as *const c_char,
        MORLOC_UINT64 => b"L\0".as_ptr() as *const c_char,
        MORLOC_FLOAT32 => b"f\0".as_ptr() as *const c_char,
        MORLOC_FLOAT64 => b"g\0".as_ptr() as *const c_char,
        MORLOC_STRING => b"u\0".as_ptr() as *const c_char,
        _ => ptr::null(),
    }
}

/// Inverse of arrow_format_string: map a one-character Arrow format
/// string back to a morloc serial type (MORLOC_NIL on failure).
#[no_mangle]
pub unsafe extern "C" fn arrow_format_to_type(format: *const c_char) -> u32 {
    // Only single-character format strings are supported here.
    if format.is_null() || *format == 0 || *format.add(1) != 0 {
        return MORLOC_NIL;
    }
    match *format as u8 {
        b'b' => MORLOC_BOOL,
        b'c' => MORLOC_SINT8,
        b'C' => MORLOC_UINT8,
        b's' => MORLOC_SINT16,
        b'S' => MORLOC_UINT16,
        b'i' => MORLOC_SINT32,
        b'I' => MORLOC_UINT32,
        b'l' => MORLOC_SINT64,
        b'L' => MORLOC_UINT64,
        b'f' => MORLOC_FLOAT32,
        b'g' => MORLOC_FLOAT64,
        b'u' => MORLOC_STRING,
        _ => MORLOC_NIL,
    }
}

// ── Column accessors (used by arrow_json.c) ──────────────────────────────────

/// Pointer to the col_index-th column descriptor, or NULL if out of range.
/// Descriptors are laid out immediately after the ArrowShmHeader.
#[no_mangle]
pub unsafe extern "C" fn arrow_column_desc(
    header: *const ArrowShmHeader,
    col_index: u32,
) -> *const ArrowColumnDesc {
    if header.is_null() || col_index >= (*header).n_columns {
        return ptr::null();
    }
    let descs = (header as *const u8).add(std::mem::size_of::<ArrowShmHeader>())
        as *const ArrowColumnDesc;
    descs.add(col_index as usize)
}

/// Pointer to the column's data buffer within the SHM block.
#[no_mangle]
pub unsafe extern "C" fn arrow_column_data(
    header: *const ArrowShmHeader,
    col_index: u32,
) -> *const c_void {
    let desc = arrow_column_desc(header, col_index);
    if desc.is_null() {
        return ptr::null();
    }
    (header as *const u8).add((*desc).data_offset as usize) as *const c_void
}

/// Pointer to the column's name bytes (NOT NUL-terminated; length is in
/// the descriptor's name_length field).
#[no_mangle]
pub unsafe extern "C" fn arrow_column_name(
    header: *const ArrowShmHeader,
    col_index: u32,
) -> *const c_char {
    let desc = arrow_column_desc(header, col_index);
    if desc.is_null() {
        return ptr::null();
    }
    (header as *const u8).add((*desc).name_offset as usize) as *const c_char
}

// ── arrow_to_shm ─────────────────────────────────────────────────────────────

/// Copy an Arrow struct array into a single morloc SHM allocation and
/// return its relative pointer (RELNULL on failure, with errmsg set).
#[no_mangle]
pub unsafe extern "C" fn arrow_to_shm(
    array: *const ArrowArray,
    schema: *const ArrowSchema,
    errmsg: *mut *mut c_char,
) -> RelPtr {
    clear_errmsg(errmsg);
    if array.is_null() || schema.is_null() {
        set_errmsg(errmsg, &MorlocError::Other("NULL array or schema".into()));
        return shm::RELNULL;
    }
    // Verify struct type
    if (*schema).format.is_null()
        || libc::strcmp((*schema).format, b"+s\0".as_ptr() as *const c_char) != 0
    {
        set_errmsg(errmsg, &MorlocError::Other("Expected struct schema (format '+s')".into()));
        return shm::RELNULL;
    }
    let n_cols = (*schema).n_children as usize;
    let n_rows = (*array).length as usize;
    if n_cols == 0 {
        set_errmsg(errmsg, &MorlocError::Other("Arrow struct must have at least one column".into()));
        return shm::RELNULL;
    }
    // First pass: size the allocation (header + descriptors + names + data).
    let header_size = std::mem::size_of::<ArrowShmHeader>();
    let descs_size = n_cols * std::mem::size_of::<ArrowColumnDesc>();
    let mut names_size: usize = 0;
    for i in 0..n_cols {
        let child_schema = *(*schema).children.add(i);
        let name = (*child_schema).name;
        if !name.is_null() {
            names_size += libc::strlen(name);
        }
    }
    let data_start = arrow_align_up(header_size + descs_size + names_size);
    let mut total_size = data_start;
    for i in 0..n_cols {
        let child_schema = *(*schema).children.add(i);
        let col_type = arrow_format_to_type((*child_schema).format);
        let elem_size = arrow_element_size(col_type);
        if col_type == MORLOC_STRING {
            // Strings need an (n_rows + 1) i32 offsets buffer plus the bytes.
            let child = *(*array).children.add(i);
            let offsets = if (*child).n_buffers >= 2 {
                *(*child).buffers.add(1) as *const i32
            } else {
                ptr::null()
            };
            let str_data_size = if !offsets.is_null() {
                let off = (*child).offset as usize;
                (*offsets.add(off + n_rows) - *offsets.add(off)) as usize
            } else {
                0
            };
            total_size = arrow_align_up(total_size)
                + (n_rows + 1) * std::mem::size_of::<i32>()
                + str_data_size;
        } else {
            if elem_size == 0 {
                set_errmsg(errmsg, &MorlocError::Other(format!("Unsupported Arrow column type for column {}", i)));
                return shm::RELNULL;
            }
            total_size = arrow_align_up(total_size) + elem_size * n_rows;
        }
    }
    let shm_ptr = match shm::shmalloc(total_size) {
        Ok(p) => p,
        Err(e) => {
            set_errmsg(errmsg, &e);
            return shm::RELNULL;
        }
    };
    ptr::write_bytes(shm_ptr, 0, total_size);
    // Write header
    let header = &mut *(shm_ptr as *mut ArrowShmHeader);
    header.magic = ARROW_SHM_MAGIC;
    header.n_columns = n_cols as u32;
    header.n_rows = n_rows as u64;
    header.total_size = total_size as u64;
    // Second pass: fill descriptors, names, and column data.
    let descs = shm_ptr.add(header_size) as *mut ArrowColumnDesc;
    let mut name_cursor = header_size + descs_size;
    let mut data_cursor = data_start;
    for i in 0..n_cols {
        let child_schema = *(*schema).children.add(i);
        let child_array = *(*array).children.add(i);
        let col_type = arrow_format_to_type((*child_schema).format);
        data_cursor = arrow_align_up(data_cursor);
        let name = if (*child_schema).name.is_null() {
            b"\0".as_ptr() as *const c_char
        } else {
            (*child_schema).name
        };
        let name_len = libc::strlen(name);
        let desc = &mut *descs.add(i);
        desc.col_type = col_type;
        desc.length = n_rows as u64;
        desc.null_count = (*child_array).null_count as u64;
        desc.name_offset = name_cursor as u32;
        desc.name_length = name_len as u16;
        desc.data_offset = data_cursor as u64;
        if name_len > 0 {
            ptr::copy_nonoverlapping(name as *const u8, shm_ptr.add(name_cursor), name_len);
        }
        name_cursor += name_len;
        if col_type == MORLOC_STRING {
            let src_offsets = if (*child_array).n_buffers >= 2 {
                *(*child_array).buffers.add(1) as *const i32
            } else {
                ptr::null()
            };
            let src_data = if (*child_array).n_buffers >= 3 {
                *(*child_array).buffers.add(2) as *const u8
            } else {
                ptr::null()
            };
            let arr_offset = (*child_array).offset as usize;
            let dst_offsets = shm_ptr.add(data_cursor) as *mut i32;
            // Rebase offsets so the copied column starts at 0.
            let base = if !src_offsets.is_null() {
                *src_offsets.add(arr_offset)
            } else {
                0
            };
            for r in 0..=n_rows {
                *dst_offsets.add(r) = if !src_offsets.is_null() {
                    *src_offsets.add(arr_offset + r) - base
                } else {
                    0
                };
            }
            let offsets_size = (n_rows + 1) * std::mem::size_of::<i32>();
            let str_data_size = if !src_offsets.is_null() {
                (*src_offsets.add(arr_offset + n_rows) - base) as usize
            } else {
                0
            };
            if str_data_size > 0 && !src_data.is_null() {
                ptr::copy_nonoverlapping(
                    src_data.add(base as usize),
                    shm_ptr.add(data_cursor + offsets_size),
                    str_data_size,
                );
            }
            let buf_size = offsets_size + str_data_size;
            desc.data_size = buf_size as u64;
            data_cursor += buf_size;
        } else {
            let elem_size = arrow_element_size(col_type);
            let buf_size = elem_size * n_rows;
            desc.data_size = buf_size as u64;
            if (*child_array).n_buffers >= 2 && !(*(*child_array).buffers.add(1)).is_null() {
                // buffers[1] is the data buffer; honor the array's offset.
                let src = (*(*child_array).buffers.add(1) as *const u8)
                    .add((*child_array).offset as usize * elem_size);
                if buf_size > 0 {
                    ptr::copy_nonoverlapping(src, shm_ptr.add(data_cursor), buf_size);
                }
            }
            data_cursor += buf_size;
        }
    }
    match shm::abs2rel(shm_ptr) {
        Ok(r) => r,
        Err(e) => {
            set_errmsg(errmsg, &e);
            shm::RELNULL
        }
    }
}

// ── arrow_validate ───────────────────────────────────────────────────────────
#[no_mangle] pub unsafe extern "C" fn arrow_validate( header: *const ArrowShmHeader, schema: *const CSchema, errmsg: *mut *mut c_char, ) -> i32 { clear_errmsg(errmsg); if header.is_null() { set_errmsg(errmsg, &MorlocError::Other("NULL arrow header".into())); return 1; } if (*header).magic != ARROW_SHM_MAGIC { set_errmsg(errmsg, &MorlocError::Other("Invalid arrow SHM magic".into())); return 1; } if schema.is_null() { set_errmsg(errmsg, &MorlocError::Other("NULL schema for arrow validation".into())); return 1; } // MORLOC_MAP = 16 if (*schema).serial_type != crate::schema::SerialType::Map as u32 { set_errmsg(errmsg, &MorlocError::Other("Expected MORLOC_MAP schema for arrow table".into())); return 1; } let n_cols = (*header).n_columns as usize; if n_cols != (*schema).size { set_errmsg(errmsg, &MorlocError::Other(format!("Column count mismatch: arrow has {}, schema has {}", n_cols, (*schema).size))); return 1; } for i in 0..n_cols { let desc = arrow_column_desc(header, i as u32); if desc.is_null() { set_errmsg(errmsg, &MorlocError::Other(format!("NULL column descriptor at index {}", i))); return 1; } let param_schema = *(*schema).parameters.add(i); if (*desc).col_type != (*param_schema).serial_type as u32 { set_errmsg(errmsg, &MorlocError::Other(format!("Column {} type mismatch", i))); return 1; } } 0 } // ── Release callbacks for arrow_from_shm ───────────────────────────────────── unsafe extern "C" fn arrow_shm_child_schema_release(schema: *mut ArrowSchema) { if schema.is_null() { return; } if !(*schema).name.is_null() { libc::free((*schema).name as *mut c_void); } (*schema).name = ptr::null(); (*schema).release = None; } unsafe extern "C" fn arrow_shm_child_array_release(array: *mut ArrowArray) { if array.is_null() { return; } if !(*array).buffers.is_null() { libc::free((*array).buffers as *mut c_void); } (*array).buffers = ptr::null_mut(); (*array).release = None; } unsafe extern "C" fn arrow_shm_schema_release(schema: *mut ArrowSchema) { if schema.is_null() { 
return; } for i in 0..(*schema).n_children as usize { let child = *(*schema).children.add(i); if !child.is_null() { if let Some(release) = (*child).release { release(child); } libc::free(child as *mut c_void); } } libc::free((*schema).children as *mut c_void); (*schema).children = ptr::null_mut(); (*schema).release = None; } unsafe extern "C" fn arrow_shm_array_release(array: *mut ArrowArray) { if array.is_null() { return; } for i in 0..(*array).n_children as usize { let child = *(*array).children.add(i); if !child.is_null() { if let Some(release) = (*child).release { release(child); } libc::free(child as *mut c_void); } } libc::free((*array).children as *mut c_void); (*array).children = ptr::null_mut(); if !(*array).buffers.is_null() { libc::free((*array).buffers as *mut c_void); } (*array).buffers = ptr::null_mut(); (*array).release = None; } // ── arrow_from_shm ─────────────────────────────────────────────────────────── #[no_mangle] pub unsafe extern "C" fn arrow_from_shm( header: *const ArrowShmHeader, out_schema: *mut ArrowSchema, out_array: *mut ArrowArray, errmsg: *mut *mut c_char, ) -> i32 { clear_errmsg(errmsg); if header.is_null() { set_errmsg(errmsg, &MorlocError::Other("NULL arrow header".into())); return 1; } if (*header).magic != ARROW_SHM_MAGIC { set_errmsg(errmsg, &MorlocError::Other("Invalid arrow SHM magic".into())); return 1; } let n_cols = (*header).n_columns as usize; let n_rows = (*header).n_rows as i64; // Parent schema (struct type) ptr::write_bytes(out_schema, 0, 1); (*out_schema).format = b"+s\0".as_ptr() as *const c_char; (*out_schema).n_children = n_cols as i64; (*out_schema).children = libc::calloc(n_cols, std::mem::size_of::<*mut ArrowSchema>()) as *mut *mut ArrowSchema; (*out_schema).release = Some(arrow_shm_schema_release); // Parent array ptr::write_bytes(out_array, 0, 1); (*out_array).length = n_rows; (*out_array).n_buffers = 1; (*out_array).buffers = libc::calloc(1, std::mem::size_of::<*const c_void>()) as *mut *const c_void; 
(*out_array).n_children = n_cols as i64; (*out_array).children = libc::calloc(n_cols, std::mem::size_of::<*mut ArrowArray>()) as *mut *mut ArrowArray; (*out_array).release = Some(arrow_shm_array_release); for i in 0..n_cols { let desc = arrow_column_desc(header, i as u32); // Child schema let child_s = libc::calloc(1, std::mem::size_of::()) as *mut ArrowSchema; (*child_s).release = Some(arrow_shm_child_schema_release); *(*out_schema).children.add(i) = child_s; (*child_s).format = arrow_format_string((*desc).col_type); let raw_name = arrow_column_name(header, i as u32); let name_len = (*desc).name_length as usize; let name_copy = libc::calloc(name_len + 1, 1) as *mut c_char; if !raw_name.is_null() && name_len > 0 { ptr::copy_nonoverlapping(raw_name as *const u8, name_copy as *mut u8, name_len); } (*child_s).name = name_copy; // Child array let child_a = libc::calloc(1, std::mem::size_of::()) as *mut ArrowArray; (*child_a).release = Some(arrow_shm_child_array_release); *(*out_array).children.add(i) = child_a; (*child_a).length = n_rows; (*child_a).null_count = (*desc).null_count as i64; let col_buf = arrow_column_data(header, i as u32); if (*desc).col_type == MORLOC_STRING { (*child_a).n_buffers = 3; (*child_a).buffers = libc::calloc(3, std::mem::size_of::<*const c_void>()) as *mut *const c_void; *(*child_a).buffers.add(1) = col_buf; // offsets *(*child_a).buffers.add(2) = (col_buf as *const u8).add((n_rows as usize + 1) * std::mem::size_of::()) as *const c_void; } else { (*child_a).n_buffers = 2; (*child_a).buffers = libc::calloc(2, std::mem::size_of::<*const c_void>()) as *mut *const c_void; *(*child_a).buffers.add(1) = col_buf; // zero-copy data } } 0 } // ── Arrow JSON/Table output (replaces arrow_json.c) ────────────────────────── unsafe fn print_arrow_value(desc: *const ArrowColumnDesc, col_data: *const u8, row: u64) { let row = row as usize; match (*desc).col_type { MORLOC_BOOL => { let v = *col_data.add(row); if v != 0 { libc::printf(b"true\0".as_ptr() as 
*const c_char); } else { libc::printf(b"false\0".as_ptr() as *const c_char); } } MORLOC_SINT8 => { libc::printf(b"%d\0".as_ptr() as *const c_char, *(col_data as *const i8).add(row) as i32); } MORLOC_SINT16 => { libc::printf(b"%d\0".as_ptr() as *const c_char, *(col_data as *const i16).add(row) as i32); } MORLOC_SINT32 => { libc::printf(b"%d\0".as_ptr() as *const c_char, *(col_data as *const i32).add(row)); } MORLOC_SINT64 => { libc::printf(b"%ld\0".as_ptr() as *const c_char, *(col_data as *const i64).add(row)); } MORLOC_UINT8 => { libc::printf(b"%u\0".as_ptr() as *const c_char, *col_data.add(row) as u32); } MORLOC_UINT16 => { libc::printf(b"%u\0".as_ptr() as *const c_char, *(col_data as *const u16).add(row) as u32); } MORLOC_UINT32 => { libc::printf(b"%u\0".as_ptr() as *const c_char, *(col_data as *const u32).add(row)); } MORLOC_UINT64 => { libc::printf(b"%lu\0".as_ptr() as *const c_char, *(col_data as *const u64).add(row)); } MORLOC_FLOAT32 => { libc::printf(b"%.7g\0".as_ptr() as *const c_char, *(col_data as *const f32).add(row) as f64); } MORLOC_FLOAT64 => { libc::printf(b"%.15g\0".as_ptr() as *const c_char, *(col_data as *const f64).add(row)); } MORLOC_STRING => { let offsets = col_data as *const i32; let str_data = offsets.add((*desc).length as usize + 1) as *const u8; let start = *offsets.add(row) as usize; let end = *offsets.add(row + 1) as usize; libc::putchar(b'"' as i32); for i in start..end { let c = *str_data.add(i); match c { b'"' => { libc::printf(b"\\\"\0".as_ptr() as *const c_char); } b'\\' => { libc::printf(b"\\\\\0".as_ptr() as *const c_char); } b'\n' => { libc::printf(b"\\n\0".as_ptr() as *const c_char); } b'\r' => { libc::printf(b"\\r\0".as_ptr() as *const c_char); } b'\t' => { libc::printf(b"\\t\0".as_ptr() as *const c_char); } _ if c < 32 => { libc::printf(b"\\u%04x\0".as_ptr() as *const c_char, c as u32); } _ => { libc::putchar(c as i32); } } } libc::putchar(b'"' as i32); } _ => { libc::printf(b"null\0".as_ptr() as *const c_char); } } } 
#[no_mangle] pub unsafe extern "C" fn print_arrow_as_json( data: *const c_void, errmsg: *mut *mut c_char, ) -> bool { use crate::error::{clear_errmsg, set_errmsg, MorlocError}; clear_errmsg(errmsg); let header = data as *const ArrowShmHeader; if header.is_null() { set_errmsg(errmsg, &MorlocError::Other("NULL arrow data".into())); return false; } if (*header).magic != ARROW_SHM_MAGIC { set_errmsg(errmsg, &MorlocError::Other(format!("Invalid arrow SHM magic: 0x{:08x}", (*header).magic))); return false; } let n_cols = (*header).n_columns; let n_rows = (*header).n_rows; libc::putchar(b'[' as i32); for r in 0..n_rows { if r > 0 { libc::putchar(b',' as i32); } libc::putchar(b'{' as i32); for c in 0..n_cols { if c > 0 { libc::putchar(b',' as i32); } let desc = arrow_column_desc(header, c); let name = arrow_column_name(header, c); let col_data = arrow_column_data(header, c); if !name.is_null() { libc::printf(b"\"%.*s\":\0".as_ptr() as *const c_char, (*desc).name_length as i32, name); } if !desc.is_null() && !col_data.is_null() { print_arrow_value(desc, col_data as *const u8, r); } else { libc::printf(b"null\0".as_ptr() as *const c_char); } } libc::putchar(b'}' as i32); } libc::printf(b"]\n\0".as_ptr() as *const c_char); true } #[no_mangle] pub unsafe extern "C" fn print_arrow_as_table( data: *const c_void, errmsg: *mut *mut c_char, ) -> bool { use crate::error::{clear_errmsg, set_errmsg, MorlocError}; clear_errmsg(errmsg); let header = data as *const ArrowShmHeader; if header.is_null() { set_errmsg(errmsg, &MorlocError::Other("NULL arrow data".into())); return false; } if (*header).magic != ARROW_SHM_MAGIC { set_errmsg(errmsg, &MorlocError::Other(format!("Invalid arrow SHM magic: 0x{:08x}", (*header).magic))); return false; } let n_cols = (*header).n_columns; let n_rows = (*header).n_rows; for c in 0..n_cols { if c > 0 { libc::putchar(b'\t' as i32); } let desc = arrow_column_desc(header, c); let name = arrow_column_name(header, c); if !name.is_null() && !desc.is_null() { 
libc::printf(b"%.*s\0".as_ptr() as *const c_char, (*desc).name_length as i32, name); } } libc::putchar(b'\n' as i32); for r in 0..n_rows { for c in 0..n_cols { if c > 0 { libc::putchar(b'\t' as i32); } let desc = arrow_column_desc(header, c); let col_data = arrow_column_data(header, c); if !desc.is_null() && !col_data.is_null() { print_arrow_value(desc, col_data as *const u8, r); } } libc::putchar(b'\n' as i32); } true } ================================================ FILE: data/rust/morloc-runtime/src/cache.rs ================================================ //! File-based packet caching with xxHash keys. //! Replaces cache.c. use std::ffi::{c_char, c_void, CStr, CString}; use std::ptr; use crate::cschema::CSchema; use crate::error::{clear_errmsg, set_errmsg, MorlocError}; use crate::hash; use crate::shm; // ── hash_voidstar ────────────────────────────────────────────────────────── #[no_mangle] pub unsafe extern "C" fn hash_voidstar( data: *const c_void, schema: *const CSchema, seed: u64, errmsg: *mut *mut c_char, ) -> u64 { clear_errmsg(errmsg); let rs = CSchema::to_rust(schema); match hash_voidstar_inner(data as *const u8, &rs, seed) { Ok(h) => h, Err(e) => { set_errmsg(errmsg, &e); 0 } } } fn hash_voidstar_inner( data: *const u8, schema: &crate::schema::Schema, seed: u64, ) -> Result { use crate::schema::SerialType; // SAFETY: data points to voidstar data in SHM with layout described by schema. // All reads (Array headers, element data) are within schema-defined bounds. 
unsafe { match schema.serial_type { SerialType::String | SerialType::Array => { let arr = &*(data as *const shm::Array); let elem_width = if schema.parameters.is_empty() { 1 // string bytes } else { schema.parameters[0].width }; let elem_data = shm::rel2abs(arr.data)?; if schema.is_fixed_width() || schema.serial_type == SerialType::String { let total = elem_width * arr.size; let bytes = std::slice::from_raw_parts(elem_data, total); Ok(hash::xxh64_with_seed(bytes, seed)) } else { let mut h = seed; for i in 0..arr.size { h = hash_voidstar_inner( elem_data.add(i * elem_width), &schema.parameters[0], h, )?; } Ok(h) } } SerialType::Tuple | SerialType::Map => { if schema.is_fixed_width() { let bytes = std::slice::from_raw_parts(data, schema.width); Ok(hash::xxh64_with_seed(bytes, seed)) } else { let mut h = seed; for i in 0..schema.parameters.len() { h = hash_voidstar_inner( data.add(schema.offsets[i]), &schema.parameters[i], h, )?; } Ok(h) } } _ => { let bytes = std::slice::from_raw_parts(data, schema.width); Ok(hash::xxh64_with_seed(bytes, seed)) } } } } // ── hash_morloc_packet ───────────────────────────────────────────────────── #[no_mangle] pub unsafe extern "C" fn hash_morloc_packet( packet: *const u8, schema: *const CSchema, seed: u64, hash_out: *mut u64, errmsg: *mut *mut c_char, ) -> bool { clear_errmsg(errmsg); *hash_out = 0; extern "C" { fn read_morloc_packet_header( msg: *const u8, errmsg: *mut *mut c_char, ) -> *const crate::packet::PacketHeader; fn morloc_packet_size(packet: *const u8, errmsg: *mut *mut c_char) -> usize; fn get_morloc_data_packet_value( data: *const u8, schema: *const CSchema, errmsg: *mut *mut c_char, ) -> *mut u8; } let mut err: *mut c_char = ptr::null_mut(); let header = read_morloc_packet_header(packet, &mut err); if header.is_null() { if !err.is_null() { *errmsg = err; } return false; } let cmd_type = (*header).command_type(); if cmd_type == crate::packet::PACKET_TYPE_CALL { let midx = { (*header).command.call.midx }; *hash_out = 
crate::utility::mix(seed, midx as u64); let offset = { (*header).offset } as usize; let length = { (*header).length } as usize; let arg_data = packet.add(32 + offset); let mut arg_start = 0usize; while arg_start < length { let arg_size = morloc_packet_size(arg_data.add(arg_start), &mut err); if !err.is_null() { *errmsg = err; return false; } let arg_bytes = std::slice::from_raw_parts(arg_data.add(arg_start), arg_size); *hash_out = crate::utility::mix(*hash_out, hash::xxh64_with_seed(arg_bytes, *hash_out)); arg_start += arg_size; } } else if cmd_type == crate::packet::PACKET_TYPE_DATA { let voidstar = get_morloc_data_packet_value(packet, schema, &mut err); if voidstar.is_null() { if !err.is_null() { *errmsg = err; } return false; } let rs = CSchema::to_rust(schema); match hash_voidstar_inner(voidstar, &rs, seed) { Ok(h) => *hash_out = h, Err(e) => { set_errmsg(errmsg, &e); return false; } } } else { set_errmsg( errmsg, &MorlocError::Other(format!("Cannot hash packet with command 0x{:02x}", cmd_type)), ); return false; } true } // ── Cache filename generation ────────────────────────────────────────────── #[no_mangle] pub unsafe extern "C" fn make_cache_filename_ext( key: u64, cache_path: *const c_char, ext: *const c_char, errmsg: *mut *mut c_char, ) -> *mut c_char { clear_errmsg(errmsg); let path = CStr::from_ptr(cache_path).to_string_lossy(); let extension = CStr::from_ptr(ext).to_string_lossy(); let filename = format!("{}/{:016x}{}", path, key, extension); match CString::new(filename) { Ok(cs) => cs.into_raw(), Err(_) => { set_errmsg(errmsg, &MorlocError::Other("CString conversion failed".into())); ptr::null_mut() } } } #[no_mangle] pub unsafe extern "C" fn make_cache_filename( key: u64, cache_path: *const c_char, errmsg: *mut *mut c_char, ) -> *mut c_char { let ext = CString::new(".packet").unwrap(); make_cache_filename_ext(key, cache_path, ext.as_ptr(), errmsg) } // ── Cache operations ─────────────────────────────────────────────────────── #[no_mangle] pub 
unsafe extern "C" fn put_cache_packet( voidstar: *const u8, schema: *const CSchema, key: u64, cache_path: *const c_char, errmsg: *mut *mut c_char, ) -> *mut c_char { clear_errmsg(errmsg); extern "C" { fn make_mpk_data_packet(filename: *const c_char, schema: *const CSchema) -> *mut u8; fn morloc_packet_size(packet: *const u8, errmsg: *mut *mut c_char) -> usize; fn pack_with_schema( mlc: *const c_void, schema: *const CSchema, mpk: *mut *mut c_char, mpk_size: *mut usize, errmsg: *mut *mut c_char, ) -> i32; fn write_atomic( filename: *const c_char, data: *const u8, size: usize, errmsg: *mut *mut c_char, ) -> i32; } let mut err: *mut c_char = ptr::null_mut(); // Generate filenames let pkt_filename = make_cache_filename(key, cache_path, &mut err); if pkt_filename.is_null() { *errmsg = err; return ptr::null_mut(); } let dat_ext = CString::new(".dat").unwrap(); let dat_filename = make_cache_filename_ext(key, cache_path, dat_ext.as_ptr(), &mut err); if dat_filename.is_null() { libc::free(pkt_filename as *mut c_void); *errmsg = err; return ptr::null_mut(); } // Create data packet pointing to the .dat file let data_packet = make_mpk_data_packet(dat_filename, schema); if data_packet.is_null() { libc::free(pkt_filename as *mut c_void); libc::free(dat_filename as *mut c_void); set_errmsg(errmsg, &MorlocError::Other("Failed to create data packet".into())); return ptr::null_mut(); } let pkt_size = morloc_packet_size(data_packet, &mut err); // Pack voidstar to msgpack let mut mpk_data: *mut c_char = ptr::null_mut(); let mut mpk_size: usize = 0; let rc = pack_with_schema(voidstar as *const c_void, schema, &mut mpk_data, &mut mpk_size, &mut err); if rc != 0 { libc::free(data_packet as *mut c_void); libc::free(pkt_filename as *mut c_void); libc::free(dat_filename as *mut c_void); *errmsg = err; return ptr::null_mut(); } // Write packet file write_atomic(pkt_filename, data_packet, pkt_size, &mut err); libc::free(data_packet as *mut c_void); if !err.is_null() { libc::free(mpk_data as 
*mut c_void); libc::free(pkt_filename as *mut c_void); libc::free(dat_filename as *mut c_void); *errmsg = err; return ptr::null_mut(); } // Write data file write_atomic(dat_filename, mpk_data as *const u8, mpk_size, &mut err); libc::free(mpk_data as *mut c_void); libc::free(dat_filename as *mut c_void); if !err.is_null() { libc::free(pkt_filename as *mut c_void); *errmsg = err; return ptr::null_mut(); } // Return the packet filename let result = libc::strdup(pkt_filename); libc::free(pkt_filename as *mut c_void); result } #[no_mangle] pub unsafe extern "C" fn get_cache_packet( key: u64, cache_path: *const c_char, errmsg: *mut *mut c_char, ) -> *mut u8 { clear_errmsg(errmsg); let mut err: *mut c_char = ptr::null_mut(); let filename = make_cache_filename(key, cache_path, &mut err); if filename.is_null() { *errmsg = err; return ptr::null_mut(); } extern "C" { fn read_binary_file( filename: *const c_char, file_size: *mut usize, errmsg: *mut *mut c_char, ) -> *mut u8; } let mut file_size: usize = 0; let data = read_binary_file(filename, &mut file_size, &mut err); libc::free(filename as *mut c_void); if data.is_null() { *errmsg = err; } data } #[no_mangle] pub unsafe extern "C" fn del_cache_packet( key: u64, cache_path: *const c_char, errmsg: *mut *mut c_char, ) -> bool { clear_errmsg(errmsg); let mut err: *mut c_char = ptr::null_mut(); let filename = make_cache_filename(key, cache_path, &mut err); if filename.is_null() { *errmsg = err; return false; } let rc = libc::unlink(filename); if rc != 0 { set_errmsg( errmsg, &MorlocError::Other(format!( "Failed to delete cache file '{}'", CStr::from_ptr(filename).to_string_lossy() )), ); libc::free(filename as *mut c_void); return false; } libc::free(filename as *mut c_void); true } #[no_mangle] pub unsafe extern "C" fn check_cache_packet( key: u64, cache_path: *const c_char, errmsg: *mut *mut c_char, ) -> *mut c_char { clear_errmsg(errmsg); let mut err: *mut c_char = ptr::null_mut(); let filename = make_cache_filename(key, 
cache_path, &mut err); if filename.is_null() { *errmsg = err; return ptr::null_mut(); } let mut sb: libc::stat = std::mem::zeroed(); if libc::stat(filename, &mut sb) == 0 { let result = libc::strdup(filename); libc::free(filename as *mut c_void); return result; } libc::free(filename as *mut c_void); ptr::null_mut() // Not an error — cache miss } ================================================ FILE: data/rust/morloc-runtime/src/cli.rs ================================================ //! CLI argument handling and voidstar utility functions. //! Replaces cli.c. use std::ffi::{c_char, c_void, CStr}; use std::ptr; use crate::cschema::CSchema; use crate::error::{clear_errmsg, set_errmsg, MorlocError}; use crate::packet; use crate::shm; // ── argument_t lifecycle ─────────────────────────────────────────────────── // argument_t is defined in eval.h (C). We use it opaquely via libc pointers. // The struct: { value: *mut c_char, fields: *mut *mut c_char, default_fields: *mut *mut c_char, size: usize } #[repr(C)] pub struct ArgumentT { pub value: *mut c_char, pub fields: *mut *mut c_char, pub default_fields: *mut *mut c_char, pub size: usize, } #[no_mangle] pub unsafe extern "C" fn initialize_positional(value: *mut c_char) -> *mut ArgumentT { let arg = libc::calloc(1, std::mem::size_of::()) as *mut ArgumentT; if arg.is_null() { return ptr::null_mut(); } (*arg).value = if value.is_null() { ptr::null_mut() } else { libc::strdup(value) }; (*arg).size = 0; arg } #[no_mangle] pub unsafe extern "C" fn initialize_unrolled( size: usize, default_value: *mut c_char, fields: *mut *mut c_char, default_fields: *mut *mut c_char, ) -> *mut ArgumentT { let arg = libc::calloc(1, std::mem::size_of::()) as *mut ArgumentT; if arg.is_null() { return ptr::null_mut(); } (*arg).value = if default_value.is_null() { ptr::null_mut() } else { libc::strdup(default_value) }; (*arg).size = size; (*arg).fields = libc::calloc(size, std::mem::size_of::<*mut c_char>()) as *mut *mut c_char; for i in 0..size { 
let f = *fields.add(i); if !f.is_null() { *(*arg).fields.add(i) = libc::strdup(f); } } (*arg).default_fields = libc::calloc(size, std::mem::size_of::<*mut c_char>()) as *mut *mut c_char; for i in 0..size { let d = *default_fields.add(i); if !d.is_null() { *(*arg).default_fields.add(i) = libc::strdup(d); } } arg } #[no_mangle] pub unsafe extern "C" fn free_argument_t(arg: *mut ArgumentT) { if arg.is_null() { return; } if !(*arg).value.is_null() { libc::free((*arg).value as *mut c_void); } if !(*arg).fields.is_null() { for i in 0..(*arg).size { let f = *(*arg).fields.add(i); if !f.is_null() { libc::free(f as *mut c_void); } } libc::free((*arg).fields as *mut c_void); } if !(*arg).default_fields.is_null() { for i in 0..(*arg).size { let d = *(*arg).default_fields.add(i); if !d.is_null() { libc::free(d as *mut c_void); } } libc::free((*arg).default_fields as *mut c_void); } libc::free(arg as *mut c_void); } // ── shfree_by_schema ─────────────────────────────────────────────────────── #[no_mangle] pub unsafe extern "C" fn shfree_by_schema( ptr: *mut c_void, schema: *const CSchema, errmsg: *mut *mut c_char, ) -> bool { clear_errmsg(errmsg); if ptr.is_null() || schema.is_null() { return true; } let rs = CSchema::to_rust(schema); match shfree_by_schema_inner(ptr as *mut u8, &rs) { Ok(_) => true, Err(e) => { set_errmsg(errmsg, &e); false } } } fn shfree_by_schema_inner( ptr: *mut u8, schema: &crate::schema::Schema, ) -> Result<(), MorlocError> { use crate::schema::SerialType; // SAFETY: ptr points to voidstar data in SHM with layout described by schema. // We recursively visit sub-structures and zero metadata before the parent shfree. 
unsafe { match schema.serial_type { SerialType::String | SerialType::Array => { let arr = &*(ptr as *const shm::Array); if arr.data > 0 { if !schema.parameters.is_empty() && !schema.parameters[0].is_fixed_width() { let arr_data = shm::rel2abs(arr.data)?; let elem_width = schema.parameters[0].width; for i in 0..arr.size { shfree_by_schema_inner( arr_data.add(i * elem_width), &schema.parameters[0], )?; } } } } SerialType::Tuple | SerialType::Map => { for i in 0..schema.parameters.len() { let child = ptr.add(schema.offsets[i]); shfree_by_schema_inner(child, &schema.parameters[i])?; } } SerialType::Tensor => { // shape and data are inline, freed by parent shfree } _ => { // fixed-size: no sub-data } } // Zero this node's metadata std::ptr::write_bytes(ptr, 0, schema.width); } Ok(()) } // ── adjust_voidstar_relptrs ──────────────────────────────────────────────── #[no_mangle] pub unsafe extern "C" fn adjust_voidstar_relptrs( data: *mut c_void, schema: *const CSchema, base_rel: shm::RelPtr, errmsg: *mut *mut c_char, ) -> i32 { clear_errmsg(errmsg); let rs = CSchema::to_rust(schema); match adjust_relptrs_inner(data as *mut u8, &rs, base_rel) { Ok(_) => 0, Err(e) => { set_errmsg(errmsg, &e); 1 } } } fn adjust_relptrs_inner( data: *mut u8, schema: &crate::schema::Schema, base_rel: shm::RelPtr, ) -> Result<(), MorlocError> { use crate::schema::SerialType; // SAFETY: data points to a voidstar blob in SHM. We adjust relptrs in-place; // all pointer arithmetic stays within the blob's bounds as defined by schema. 
unsafe { match schema.serial_type { SerialType::String | SerialType::Array => { let arr = &mut *(data as *mut shm::Array); arr.data += base_rel; if !schema.parameters.is_empty() && !schema.parameters[0].is_fixed_width() { let arr_data = shm::rel2abs(arr.data)?; let elem_width = schema.parameters[0].width; for i in 0..arr.size { adjust_relptrs_inner( arr_data.add(i * elem_width), &schema.parameters[0], base_rel, )?; } } } SerialType::Tuple | SerialType::Map => { for i in 0..schema.parameters.len() { adjust_relptrs_inner( data.add(schema.offsets[i]), &schema.parameters[i], base_rel, )?; } } SerialType::Optional => { let tag = *data; if tag != 0 && !schema.parameters.is_empty() { let inner_offset = schema.offsets.first().copied().unwrap_or( shm::align_up(1, schema.parameters[0].alignment().max(1)), ); adjust_relptrs_inner( data.add(inner_offset), &schema.parameters[0], base_rel, )?; } } SerialType::Tensor => { let tensor = &mut *(data as *mut shm::Tensor); if tensor.total_elements > 0 { tensor.shape += base_rel; tensor.data += base_rel; } } _ => {} } } Ok(()) } // ── read_voidstar_binary ─────────────────────────────────────────────────── #[no_mangle] pub unsafe extern "C" fn read_voidstar_binary( blob: *const u8, blob_size: usize, schema: *const CSchema, errmsg: *mut *mut c_char, ) -> *mut c_void { clear_errmsg(errmsg); let rs = CSchema::to_rust(schema); let base = match shm::shmalloc(blob_size) { Ok(p) => p, Err(e) => { set_errmsg(errmsg, &e); return ptr::null_mut(); } }; std::ptr::copy_nonoverlapping(blob, base, blob_size); let base_rel = match shm::abs2rel(base) { Ok(r) => r, Err(e) => { let _ = shm::shfree(base); set_errmsg(errmsg, &e); return ptr::null_mut(); } }; if let Err(e) = adjust_relptrs_inner(base, &rs, base_rel) { let _ = shm::shfree(base); set_errmsg(errmsg, &e); return ptr::null_mut(); } base as *mut c_void } // ── load_morloc_data_file ────────────────────────────────────────────────── // This function is complex and calls many C functions 
(read_json_with_schema, // unpack_with_schema). Keep delegating to C for now via extern declarations. #[no_mangle] pub unsafe extern "C" fn load_morloc_data_file( path: *const c_char, data: *mut u8, data_size: usize, schema: *const CSchema, errmsg: *mut *mut c_char, ) -> *mut c_void { clear_errmsg(errmsg); extern "C" { fn read_json_with_schema( dest: *mut u8, json: *mut c_char, schema: *const CSchema, errmsg: *mut *mut c_char, ) -> *mut u8; fn unpack_with_schema( mpk: *const c_char, mpk_size: usize, schema: *const CSchema, mlcptr: *mut *mut c_void, errmsg: *mut *mut c_char, ) -> i32; } if data_size == 0 { set_errmsg(errmsg, &MorlocError::Other("Cannot parse 0-length data".into())); return ptr::null_mut(); } let path_str = CStr::from_ptr(path).to_string_lossy(); let mut err: *mut c_char = ptr::null_mut(); // 1. Extension-based dispatch if path_str.ends_with(".json") { let json_buf = libc::realloc(data as *mut c_void, data_size + 1) as *mut u8; if json_buf.is_null() { libc::free(data as *mut c_void); set_errmsg(errmsg, &MorlocError::Other("realloc failed".into())); return ptr::null_mut(); } *json_buf.add(data_size) = 0; let result = read_json_with_schema(ptr::null_mut(), json_buf as *mut c_char, schema, &mut err); if !err.is_null() { libc::free(json_buf as *mut c_void); *errmsg = err; return ptr::null_mut(); } libc::free(json_buf as *mut c_void); return result as *mut c_void; } if path_str.ends_with(".mpk") || path_str.ends_with(".msgpack") { let mut result: *mut c_void = ptr::null_mut(); unpack_with_schema(data as *const c_char, data_size, schema, &mut result, &mut err); libc::free(data as *mut c_void); if !err.is_null() { *errmsg = err; return ptr::null_mut(); } return result; } // 2. 
Check for morloc packet header if data_size >= 32 { let magic = *(data as *const u32); if magic == packet::PACKET_MAGIC { let header_bytes: &[u8; 32] = &*(data as *const [u8; 32]); if let Ok(header) = packet::PacketHeader::from_bytes(header_bytes) { if !header.is_data() { libc::free(data as *mut c_void); set_errmsg(errmsg, &MorlocError::Other(format!("Expected data packet in '{}'", path_str))); return ptr::null_mut(); } let offset = { header.offset } as usize; let length = { header.length } as usize; let payload = data.add(32 + offset); let format = { header.command.data.format }; if format == packet::PACKET_FORMAT_VOIDSTAR { let result = read_voidstar_binary(payload, length, schema, &mut err); libc::free(data as *mut c_void); if !err.is_null() { *errmsg = err; return ptr::null_mut(); } return result; } else if format == packet::PACKET_FORMAT_MSGPACK { let mut result: *mut c_void = ptr::null_mut(); unpack_with_schema(payload as *const c_char, length, schema, &mut result, &mut err); libc::free(data as *mut c_void); if !err.is_null() { *errmsg = err; return ptr::null_mut(); } return result; } else { libc::free(data as *mut c_void); set_errmsg(errmsg, &MorlocError::Other(format!("Unsupported format 0x{:02x} in '{}'", format, path_str))); return ptr::null_mut(); } } } } // 3. 
Try JSON let first_byte = *data; let may_be_json = matches!(first_byte, b'\'' | b'"' | b'[' | b'{' | b't' | b'f' | b'n' | b'\t' | b'\n' | b'\r' | b' ' | b'0'..=b'9' | b'-' ); if (data_size > 1 && may_be_json) || (data_size == 1 && first_byte >= b'0' && first_byte <= b'9') { let json_buf = libc::realloc(data as *mut c_void, data_size + 1) as *mut u8; if !json_buf.is_null() { *json_buf.add(data_size) = 0; let result = read_json_with_schema(ptr::null_mut(), json_buf as *mut c_char, schema, &mut err); if err.is_null() && !result.is_null() { libc::free(json_buf as *mut c_void); return result as *mut c_void; } if !err.is_null() { libc::free(err as *mut c_void); err = ptr::null_mut(); } // Fall through to try msgpack // Note: data pointer may have been invalidated by realloc // Use json_buf as the data pointer going forward let mut result: *mut c_void = ptr::null_mut(); unpack_with_schema(json_buf as *const c_char, data_size, schema, &mut result, &mut err); libc::free(json_buf as *mut c_void); if !err.is_null() { *errmsg = err; return ptr::null_mut(); } return result; } } // 4. Try msgpack let mut result: *mut c_void = ptr::null_mut(); unpack_with_schema(data as *const c_char, data_size, schema, &mut result, &mut err); libc::free(data as *mut c_void); if !err.is_null() { *errmsg = err; return ptr::null_mut(); } result } // ── upload_packet (static helper) ──────────────────────────────────────────── /// Copy a voidstar packet into SHM, adjusting relptrs. /// /// # Safety /// `dest` must point to schema.width writable bytes in SHM. /// `data` must point to a valid voidstar blob within [data, data_end]. 
unsafe fn upload_packet( dest: *mut u8, data: *const u8, data_end: usize, schema: *const CSchema, errmsg: *mut *mut c_char, ) -> i32 { clear_errmsg(errmsg); let rs = CSchema::to_rust(schema); match upload_packet_inner(dest, data, data_end, schema, &rs) { Ok(_) => 0, Err(e) => { set_errmsg(errmsg, &e); 1 } } } unsafe fn upload_packet_inner( dest: *mut u8, data: *const u8, data_end: usize, schema: *const CSchema, rs: &crate::schema::Schema, ) -> Result<(), MorlocError> { use crate::schema::SerialType; match rs.serial_type { SerialType::String | SerialType::Array => { if (data as usize + rs.width - 1) <= data_end { return Err(MorlocError::Packet("Data is too small to store an array header".into())); } ptr::copy_nonoverlapping(data, dest, rs.width); let arr = &mut *(dest as *mut shm::Array); let arr_data_offset = arr.data as usize; let arr_data = data.add(arr_data_offset); let elem_width = rs.parameters[0].width; let arr_size = arr.size * elem_width; if (arr_data as usize + arr_size - 1) > data_end { return Err(MorlocError::Packet("Data is too small to contain array values".into())); } let data_ptr = shm::shmemcpy(arr_data, arr_size)?; if !rs.is_fixed_width() { let elem_schema = &rs.parameters[0]; // Need the C schema for each element let elem_c_schema = (*schema).parameters; if !elem_c_schema.is_null() { let elem_cs = *elem_c_schema; for i in 0..arr.size { upload_packet_inner( data_ptr.add(i * elem_width), arr_data.add(i * elem_width), data_end, elem_cs, elem_schema, )?; } } } arr.data = shm::abs2rel(data_ptr)?; } SerialType::Tuple | SerialType::Map => { for i in 0..rs.parameters.len() { let elem_cs = if (*schema).parameters.is_null() { return Err(MorlocError::Packet("NULL parameters in schema".into())); } else { *(*schema).parameters.add(i) }; upload_packet_inner( dest.add(rs.offsets[i]), data.add(rs.offsets[i]), data_end, elem_cs, &rs.parameters[i], )?; } } _ => { if (data as usize + rs.width - 1) > data_end { return Err(MorlocError::Packet("Given data packet is too 
small".into())); } ptr::copy_nonoverlapping(data, dest, rs.width); } } Ok(()) } // ── parse_cli_data_argument_singular ───────────────────────────────────────── unsafe fn parse_cli_data_argument_singular( mut dest: *mut u8, arg: *mut c_char, schema: *const CSchema, errmsg: *mut *mut c_char, ) -> *mut u8 { clear_errmsg(errmsg); extern "C" { fn read_json_with_schema( dest: *mut u8, json: *mut c_char, schema: *const CSchema, errmsg: *mut *mut c_char, ) -> *mut u8; fn file_exists(filename: *const c_char) -> bool; fn read_binary_fd(file: *mut libc::FILE, file_size: *mut usize, errmsg: *mut *mut c_char) -> *mut u8; } let rs = CSchema::to_rust(schema); let mut err: *mut c_char = ptr::null_mut(); let mut fd: *mut libc::FILE = ptr::null_mut(); // handle STDIN let stdin_path = b"/dev/stdin\0"; let dash_path = b"-\0"; if libc::strcmp(arg, stdin_path.as_ptr() as *const c_char) == 0 || libc::strcmp(arg, dash_path.as_ptr() as *const c_char) == 0 { fd = libc::fdopen(libc::STDIN_FILENO, b"rb\0".as_ptr() as *const c_char); } else if file_exists(arg) { fd = libc::fopen(arg, b"rb\0".as_ptr() as *const c_char); if fd.is_null() { set_errmsg(errmsg, &MorlocError::Other( format!("The argument '{}' is a filename, but it can't be read", CStr::from_ptr(arg).to_string_lossy()) )); return ptr::null_mut(); } } if fd.is_null() { // Literal JSON data if dest.is_null() { match shm::shcalloc(1, rs.width) { Ok(p) => dest = p, Err(e) => { set_errmsg(errmsg, &e); return ptr::null_mut(); } } } dest = read_json_with_schema(dest, arg, schema, &mut err); if !err.is_null() { *errmsg = err; return ptr::null_mut(); } return dest; } // File or stdin let mut data_size: usize = 0; let data = read_binary_fd(fd, &mut data_size, &mut err); // Don't close stdin if fd != libc::fdopen(libc::STDIN_FILENO, b"rb\0".as_ptr() as *const c_char) { libc::fclose(fd); } if !err.is_null() { if !data.is_null() { libc::free(data as *mut c_void); } *errmsg = err; return ptr::null_mut(); } // Special case: RPTR packets if 
data_size >= 32 { let magic = *(data as *const u32); if magic == packet::PACKET_MAGIC { let header = &*(data as *const packet::PacketHeader); let source = header.command.data.source; let format = header.command.data.format; if source == packet::PACKET_SOURCE_RPTR && format == packet::PACKET_FORMAT_VOIDSTAR { if dest.is_null() { match shm::shcalloc(1, rs.width) { Ok(p) => dest = p, Err(e) => { libc::free(data as *mut c_void); set_errmsg(errmsg, &e); return ptr::null_mut(); } } } let voidstar_ptr = data.add(32 + header.offset as usize); if upload_packet(dest, voidstar_ptr, voidstar_ptr as usize + data_size - 1, schema, &mut err) != 0 { libc::free(data as *mut c_void); *errmsg = err; return ptr::null_mut(); } libc::free(data as *mut c_void); return dest; } } } // All other formats: canonical file loader (takes ownership of data) dest = load_morloc_data_file(arg, data, data_size, schema, &mut err) as *mut u8; if !err.is_null() { *errmsg = err; return ptr::null_mut(); } dest } // ── parse_cli_data_argument_unrolled ───────────────────────────────────────── unsafe fn parse_cli_data_argument_unrolled( mut dest: *mut u8, default_value: *mut c_char, fields: *mut *mut c_char, default_fields: *mut *mut c_char, schema: *const CSchema, errmsg: *mut *mut c_char, ) -> *mut u8 { clear_errmsg(errmsg); let rs = CSchema::to_rust(schema); let mut err: *mut c_char = ptr::null_mut(); let mut using_record_default = false; if dest.is_null() { match shm::shcalloc(1, rs.width) { Ok(p) => dest = p, Err(e) => { set_errmsg(errmsg, &e); return ptr::null_mut(); } } } if !default_value.is_null() { dest = parse_cli_data_argument_singular(dest, default_value, schema, &mut err); if !err.is_null() { *errmsg = err; return ptr::null_mut(); } using_record_default = true; } use crate::schema::SerialType; match rs.serial_type { SerialType::Tuple | SerialType::Map => { for i in 0..rs.parameters.len() { let element_dest = dest.add(rs.offsets[i]); let field_val = *fields.add(i); let elem_cs = 
*(*schema).parameters.add(i); if !field_val.is_null() { // Free memory from default for this field shfree_by_schema(element_dest as *mut c_void, elem_cs, &mut err); if !err.is_null() { libc::free(err as *mut c_void); err = ptr::null_mut(); } let result = parse_cli_data_argument_singular( element_dest, field_val, elem_cs, &mut err, ); if !err.is_null() { *errmsg = err; return ptr::null_mut(); } let _ = result; // result writes into element_dest } else if using_record_default { continue; } else { let default_field = *default_fields.add(i); if !default_field.is_null() { let result = parse_cli_data_argument_singular( element_dest, default_field, elem_cs, &mut err, ); if !err.is_null() { *errmsg = err; return ptr::null_mut(); } let _ = result; } else { set_errmsg(errmsg, &MorlocError::Other( format!("Field {} missing with no default or default record", i) )); return ptr::null_mut(); } } } } _ => { set_errmsg(errmsg, &MorlocError::Other("Only record and tuple types may be unrolled".into())); return ptr::null_mut(); } } dest } // ── parse_cli_data_argument ────────────────────────────────────────────────── #[no_mangle] pub unsafe extern "C" fn parse_cli_data_argument( dest: *mut u8, arg: *const ArgumentT, schema: *const CSchema, errmsg: *mut *mut c_char, ) -> *mut u8 { clear_errmsg(errmsg); let mut err: *mut c_char = ptr::null_mut(); let result = if (*arg).fields.is_null() { parse_cli_data_argument_singular(dest, (*arg).value, schema, &mut err) } else { parse_cli_data_argument_unrolled( dest, (*arg).value, (*arg).fields, (*arg).default_fields, schema, &mut err, ) }; if !err.is_null() { *errmsg = err; return ptr::null_mut(); } if result.is_null() { return ptr::null_mut(); } let relptr = match shm::abs2rel(result) { Ok(r) => r, Err(e) => { set_errmsg(errmsg, &e); return ptr::null_mut(); } }; // Call the Rust make_standard_data_packet FFI crate::packet_ffi::make_standard_data_packet(relptr, schema) } // ── make_call_packet_from_cli 
──────────────────────────────────────────────── #[no_mangle] pub unsafe extern "C" fn make_call_packet_from_cli( dest: *mut u8, mid: u32, args: *mut *mut ArgumentT, // NULL-terminated arg_schema_strs: *mut *mut c_char, // NULL-terminated errmsg: *mut *mut c_char, ) -> *mut u8 { clear_errmsg(errmsg); let mut err: *mut c_char = ptr::null_mut(); // Count and parse schemas let mut nschemas: usize = 0; while !(*arg_schema_strs.add(nschemas)).is_null() { nschemas += 1; } let mut schemas: Vec<*mut CSchema> = Vec::with_capacity(nschemas); for i in 0..nschemas { let schema = crate::ffi::parse_schema(*arg_schema_strs.add(i), &mut err); if !err.is_null() { for s in &schemas { CSchema::free(*s); } *errmsg = err; return ptr::null_mut(); } schemas.push(schema); } // Count args let mut nargs: usize = 0; while !(*args.add(nargs)).is_null() { nargs += 1; } // Parse each argument into a data packet let mut packet_args: Vec<*const u8> = Vec::with_capacity(nargs); for i in 0..nargs { let packet = parse_cli_data_argument(dest, *args.add(i), schemas[i], &mut err); if !err.is_null() { for p in &packet_args { libc::free(*p as *mut c_void); } for s in &schemas { CSchema::free(*s); } *errmsg = err; return ptr::null_mut(); } packet_args.push(packet as *const u8); } // Build call packet let call_packet = crate::packet_ffi::make_morloc_local_call_packet( mid, packet_args.as_ptr(), nargs, &mut err, ); for p in &packet_args { libc::free(*p as *mut c_void); } for s in &schemas { CSchema::free(*s); } if !err.is_null() { *errmsg = err; return ptr::null_mut(); } call_packet } ================================================ FILE: data/rust/morloc-runtime/src/cschema.rs ================================================ //! C-compatible Schema type for FFI. //! This module is always compiled (even with no-ffi-exports feature). use std::ffi::{c_char, CStr, CString}; use std::ptr; use crate::schema::{Schema, SerialType}; /// C-compatible Schema struct matching the C `Schema` layout. 
/// C-compatible Schema struct matching the C `Schema` layout.
#[repr(C)]
pub struct CSchema {
    pub serial_type: u32,
    pub size: usize,
    pub width: usize,
    pub offsets: *mut usize,
    pub hint: *mut c_char,
    pub parameters: *mut *mut CSchema,
    pub keys: *mut *mut c_char,
}

impl CSchema {
    /// Deep-copy a Rust `Schema` into a heap-allocated C-layout tree.
    /// Free the result with `CSchema::free`.
    pub fn from_rust(schema: &Schema) -> *mut CSchema {
        let cs = Box::new(CSchema {
            serial_type: schema.serial_type as u32,
            size: schema.size,
            width: schema.width,
            offsets: if schema.offsets.is_empty() {
                ptr::null_mut()
            } else {
                let mut v = schema.offsets.clone().into_boxed_slice();
                let p = v.as_mut_ptr();
                std::mem::forget(v);
                p
            },
            hint: match &schema.hint {
                Some(s) => CString::new(s.as_str()).unwrap_or_default().into_raw(),
                None => ptr::null_mut(),
            },
            parameters: if schema.parameters.is_empty() {
                ptr::null_mut()
            } else {
                // BUG FIX: `free` reconstructs this allocation with
                // Vec::from_raw_parts(p, size, size), which requires the
                // capacity to be exactly `size`. A leaked Vec from collect()
                // does not guarantee capacity == len; into_boxed_slice
                // shrinks-to-fit first (offsets above already did this).
                let mut ptrs: Box<[*mut CSchema]> = schema
                    .parameters
                    .iter()
                    .map(|p| CSchema::from_rust(p))
                    .collect::<Vec<_>>()
                    .into_boxed_slice();
                let p = ptrs.as_mut_ptr();
                std::mem::forget(ptrs);
                p
            },
            keys: if schema.keys.is_empty() {
                ptr::null_mut()
            } else {
                // Same capacity normalization as `parameters` above.
                let mut ptrs: Box<[*mut c_char]> = schema
                    .keys
                    .iter()
                    .map(|k| CString::new(k.as_str()).unwrap_or_default().into_raw())
                    .collect::<Vec<_>>()
                    .into_boxed_slice();
                let p = ptrs.as_mut_ptr();
                std::mem::forget(ptrs);
                p
            },
        });
        Box::into_raw(cs)
    }

    /// Convert a C-allocated CSchema to a Rust Schema by deep-copying all data.
    ///
    /// # Safety
    /// `cs` must be null or a valid pointer to a CSchema allocated by `from_rust`
    /// or equivalent C code. All child pointers must be valid for `cs.size` entries.
    pub unsafe fn to_rust(cs: *const CSchema) -> Schema {
        if cs.is_null() {
            return Schema::primitive(SerialType::Nil);
        }
        let cs = &*cs;
        // SAFETY: SerialType is #[repr(u32)] and cs.serial_type was set from a valid SerialType.
        let serial_type = std::mem::transmute::<u32, SerialType>(cs.serial_type);
        let offsets = if cs.offsets.is_null() || cs.size == 0 {
            Vec::new()
        } else {
            // Only container-like types carry offsets; the count depends on kind.
            let n = match serial_type {
                SerialType::Tuple | SerialType::Map => cs.size,
                SerialType::Optional | SerialType::Tensor => 1,
                _ => 0,
            };
            if n > 0 {
                std::slice::from_raw_parts(cs.offsets, n).to_vec()
            } else {
                Vec::new()
            }
        };
        let parameters = if cs.parameters.is_null() || cs.size == 0 {
            Vec::new()
        } else {
            (0..cs.size)
                .map(|i| CSchema::to_rust(*cs.parameters.add(i)))
                .collect()
        };
        let keys = if cs.keys.is_null() || cs.size == 0 {
            Vec::new()
        } else {
            // NOTE(review): NULL key entries are silently skipped, so keys
            // may end up shorter than cs.size — confirm downstream code
            // tolerates that.
            (0..cs.size)
                .filter_map(|i| {
                    let p = *cs.keys.add(i);
                    if p.is_null() {
                        None
                    } else {
                        Some(CStr::from_ptr(p).to_string_lossy().into_owned())
                    }
                })
                .collect()
        };
        let hint = if cs.hint.is_null() {
            None
        } else {
            Some(CStr::from_ptr(cs.hint).to_string_lossy().into_owned())
        };
        Schema {
            serial_type,
            size: cs.size,
            width: cs.width,
            offsets,
            hint,
            parameters,
            keys,
        }
    }
let serial_type = std::mem::transmute::(cs.serial_type); let offsets = if cs.offsets.is_null() || cs.size == 0 { Vec::new() } else { let n = match serial_type { SerialType::Tuple | SerialType::Map => cs.size, SerialType::Optional | SerialType::Tensor => 1, _ => 0, }; if n > 0 { std::slice::from_raw_parts(cs.offsets, n).to_vec() } else { Vec::new() } }; let parameters = if cs.parameters.is_null() || cs.size == 0 { Vec::new() } else { (0..cs.size) .map(|i| CSchema::to_rust(*cs.parameters.add(i))) .collect() }; let keys = if cs.keys.is_null() || cs.size == 0 { Vec::new() } else { (0..cs.size) .filter_map(|i| { let p = *cs.keys.add(i); if p.is_null() { None } else { Some(CStr::from_ptr(p).to_string_lossy().into_owned()) } }) .collect() }; let hint = if cs.hint.is_null() { None } else { Some(CStr::from_ptr(cs.hint).to_string_lossy().into_owned()) }; Schema { serial_type, size: cs.size, width: cs.width, offsets, hint, parameters, keys, } } /// Free a CSchema and all its children (same logic as ffi::free_schema). /// /// # Safety /// `schema` must be null or a valid pointer previously returned by `from_rust`. pub unsafe fn free(schema: *mut CSchema) { if schema.is_null() { return; } let cs = Box::from_raw(schema); // SAFETY: cs.serial_type was set from a valid SerialType in from_rust. 
let st = std::mem::transmute::(cs.serial_type); if !cs.offsets.is_null() { let n = match st { SerialType::Tuple | SerialType::Map => cs.size, SerialType::Optional | SerialType::Tensor => 1, _ => 0, }; if n > 0 { let _ = Vec::from_raw_parts(cs.offsets, n, n); } } if !cs.hint.is_null() { let _ = CString::from_raw(cs.hint); } if !cs.parameters.is_null() && cs.size > 0 { let ptrs = Vec::from_raw_parts(cs.parameters, cs.size, cs.size); for p in ptrs { CSchema::free(p); } } if !cs.keys.is_null() && cs.size > 0 { let ptrs = Vec::from_raw_parts(cs.keys, cs.size, cs.size); for p in ptrs { if !p.is_null() { let _ = CString::from_raw(p); } } } } } ================================================ FILE: data/rust/morloc-runtime/src/daemon_ffi.rs ================================================ //! C ABI wrappers for daemon subsystems. //! Replaces daemon.c. Uses serde_json, HashMap, VecDeque, and std::thread. use std::collections::HashMap; use std::collections::VecDeque; use std::ffi::{c_char, c_void, CStr, CString}; use std::ptr; use std::sync::atomic::{AtomicBool, AtomicI32, Ordering}; use std::sync::{Arc, Condvar, Mutex}; use crate::cschema::CSchema; use crate::error::{clear_errmsg, set_errmsg, MorlocError}; use crate::hash; use crate::http_ffi::{DaemonMethod, DaemonRequest, HttpRequest}; // -- Constants ---------------------------------------------------------------- const DEFAULT_XXHASH_SEED: u64 = 0; const MAX_LP_MESSAGE: u32 = 64 * 1024 * 1024; // -- Global state ------------------------------------------------------------- static SHUTDOWN_REQUESTED: AtomicBool = AtomicBool::new(false); static G_EVAL_TIMEOUT: AtomicI32 = AtomicI32::new(30); // SAFETY: These globals are set once during daemon_run initialization (single-threaded) // and only read afterwards. The daemon is single-threaded for request dispatch. 
// Liveness callback installed by daemon_run; queried by the "health" method.
// NOTE(review): the type here reads `Option bool>` — the angle-bracket
// contents appear to have been stripped by text extraction (presumably
// `Option<extern "C" fn(usize) -> bool>` originally). The same stripping
// affects several `Option`/`Vec`/turbofish spots below — confirm against the
// upstream repository before treating this listing as compilable.
static mut G_POOL_ALIVE_FN: Option bool> = None;
// Number of language pools the daemon manages (parallel to the sockets array).
static mut G_N_POOLS: usize = 0;
// Owned by daemon initialization; read by daemon_dispatch for bind/eval caching.
static mut G_BINDING_STORE: *mut BindingStore = ptr::null_mut();

// -- C-compatible types -------------------------------------------------------

/// Matches morloc_socket_t from call.h
/// One entry per language pool: the command used to start it, the unix socket
/// it listens on, and its process id.
#[repr(C)]
pub struct MorlocSocket {
    pub lang: *mut c_char,
    pub syscmd: *mut *mut c_char,
    pub socket_filename: *mut c_char,
    pub pid: i32,
}

/// Matches daemon_config_t from daemon.h
/// Passed in from C when the daemon starts; fields mirror the C struct layout
/// exactly (repr(C)), so field order must not change.
#[repr(C)]
pub struct DaemonConfig {
    pub unix_socket_path: *const c_char,
    pub tcp_port: i32,
    pub http_port: i32,
    // NOTE(review): callback signatures lost to the same angle-bracket
    // stripping as above — restore from daemon.h.
    pub pool_check_fn: Option,
    pub pool_alive_fn: Option bool>,
    pub n_pools: usize,
    pub eval_timeout: i32,
}

/// Matches daemon_response_t from daemon.h
/// All pointer fields are malloc/strdup-allocated C strings owned by the
/// response; daemon_free_response releases them.
#[repr(C)]
pub struct DaemonResponse {
    pub id: *mut c_char,
    pub success: bool,
    pub result_json: *mut c_char,
    pub error: *mut c_char,
}

// -- Binding store (replaces linear-probe hash table with HashMap) ------------

/// One compiled expression binding: keyed by the xxh64 of the expression text,
/// with zero or more user-assigned names aliasing it.
struct BindingEntry {
    hash: u64,
    expr: String,
    #[allow(dead_code)]
    artifact_dir: String,
    // Optional type signature (never populated in this chunk; see bind()).
    type_sig: Option,
    names: Vec,
}

/// In-memory registry of bound expressions plus an on-disk artifact directory
/// per binding (base_dir/<hash-hex>).
struct BindingStore {
    entries: HashMap,
    /// Index from name -> hash for name-based lookup
    name_index: HashMap,
    base_dir: String,
}

impl BindingStore {
    /// Create a store rooted at `base_dir`, creating the directory if needed.
    /// Directory-creation failure is deliberately ignored (best-effort).
    fn new(base_dir: &str) -> Self {
        let _ = std::fs::create_dir_all(base_dir);
        BindingStore {
            entries: HashMap::new(),
            name_index: HashMap::new(),
            base_dir: base_dir.to_string(),
        }
    }

    /// Look up a binding by its expression hash.
    fn lookup_hash(&self, hash: u64) -> Option<&BindingEntry> {
        self.entries.get(&hash)
    }

    /// Look up a binding by one of its user-assigned names.
    fn lookup_name(&self, name: &str) -> Option<&BindingEntry> {
        let hash = self.name_index.get(name)?;
        self.entries.get(hash)
    }

    /// Alias `name` to the binding with hash `hash`. The name index is updated
    /// even if no entry exists yet for that hash (intentional: bind() inserts
    /// the entry first, but callers may rebind names freely).
    fn add_name(&mut self, hash: u64, name: &str) {
        if let Some(entry) = self.entries.get_mut(&hash) {
            if !entry.names.contains(&name.to_string()) {
                entry.names.push(name.to_string());
            }
        }
        self.name_index.insert(name.to_string(), hash);
    }

    /// Compile-and-cache `expr` by forking `morloc eval --save <hex> <expr>`.
    /// Returns the expression hash on success, None on any failure (pipe/fork
    /// failure or a non-zero exit from the child). If the expression was
    /// already bound, only the optional name alias is added.
    ///
    /// `eval_timeout` (seconds) is applied in the child via RLIMIT_CPU, plus a
    /// fixed 2 GiB RLIMIT_AS address-space cap.
    fn bind(&mut self, expr: &str, name: Option<&str>, eval_timeout: i32) -> Option {
        let hv = hash::xxh64_with_seed(expr.as_bytes(), DEFAULT_XXHASH_SEED);
        if self.entries.contains_key(&hv) {
            if let Some(n) = name {
                self.add_name(hv, n);
            }
            return Some(hv);
        }
        let hash_hex = format!("{:016x}", hv);
        let artifact_dir = format!("{}/{}", self.base_dir, hash_hex);
        // Fork morloc eval --save
        unsafe {
            let mut stdout_pipe = [0i32; 2];
            let mut stderr_pipe = [0i32; 2];
            // NOTE(review): if the second pipe() fails the first pipe's fds
            // leak — confirm whether that is acceptable here.
            if libc::pipe(stdout_pipe.as_mut_ptr()) != 0
                || libc::pipe(stderr_pipe.as_mut_ptr()) != 0
            {
                return None;
            }
            let pid = libc::fork();
            if pid < 0 {
                libc::close(stdout_pipe[0]);
                libc::close(stdout_pipe[1]);
                libc::close(stderr_pipe[0]);
                libc::close(stderr_pipe[1]);
                return None;
            }
            if pid == 0 {
                // Child: wire pipe write-ends to stdout/stderr, apply resource
                // limits, then exec morloc. _exit(127) if exec fails.
                libc::close(stdout_pipe[0]);
                libc::close(stderr_pipe[0]);
                libc::dup2(stdout_pipe[1], libc::STDOUT_FILENO);
                libc::dup2(stderr_pipe[1], libc::STDERR_FILENO);
                libc::close(stdout_pipe[1]);
                libc::close(stderr_pipe[1]);
                if eval_timeout > 0 {
                    // Soft CPU limit at the timeout, hard limit 5s later so the
                    // child first gets SIGXCPU, then SIGKILL.
                    let cpu_limit = libc::rlimit {
                        rlim_cur: eval_timeout as libc::rlim_t,
                        rlim_max: (eval_timeout + 5) as libc::rlim_t,
                    };
                    libc::setrlimit(libc::RLIMIT_CPU, &cpu_limit);
                    // 2 GiB address-space cap.
                    let as_limit = libc::rlimit {
                        rlim_cur: 2 * 1024 * 1024 * 1024,
                        rlim_max: 2 * 1024 * 1024 * 1024,
                    };
                    libc::setrlimit(libc::RLIMIT_AS, &as_limit);
                }
                let cmd = CString::new("morloc").unwrap();
                let arg_eval = CString::new("eval").unwrap();
                let arg_save = CString::new("--save").unwrap();
                let arg_hex = CString::new(hash_hex.as_str()).unwrap();
                let arg_expr = CString::new(expr).unwrap();
                libc::execlp(
                    cmd.as_ptr(),
                    cmd.as_ptr(),
                    arg_eval.as_ptr(),
                    arg_save.as_ptr(),
                    arg_hex.as_ptr(),
                    arg_expr.as_ptr(),
                    ptr::null::(),
                );
                libc::_exit(127);
            }
            // Parent: close write-ends, drain stderr (up to 4095 bytes), reap.
            // NOTE(review): stdout is never read before its read-end is closed
            // below; a child that fills the stdout pipe buffer would block and
            // the stderr drain would never see EOF — confirm `morloc eval
            // --save` writes little/nothing to stdout.
            libc::close(stdout_pipe[1]);
            libc::close(stderr_pipe[1]);
            let mut stderr_buf = vec![0u8; 4096];
            let mut stderr_len: usize = 0;
            loop {
                let n = libc::read(
                    stderr_pipe[0],
                    stderr_buf.as_mut_ptr().add(stderr_len) as *mut c_void,
                    stderr_buf.len() - stderr_len - 1,
                );
                if n <= 0 {
                    break;
                }
                stderr_len += n as usize;
            }
            libc::close(stdout_pipe[0]);
            libc::close(stderr_pipe[0]);
            let mut status: i32 = 0;
            libc::waitpid(pid, &mut status, 0);
            if !libc::WIFEXITED(status) || libc::WEXITSTATUS(status) != 0 {
                // Child failed: surface its stderr on our stderr and bail.
                stderr_buf.truncate(stderr_len);
                let msg = String::from_utf8_lossy(&stderr_buf);
                eprintln!("binding_store_bind: morloc eval --save failed: {}", msg);
                return None;
            }
        }
        // Success: record the binding (type_sig left unset here).
        let entry = BindingEntry {
            hash: hv,
            expr: expr.to_string(),
            artifact_dir,
            type_sig: None,
            names: Vec::new(),
        };
        self.entries.insert(hv, entry);
        if let Some(n) = name {
            self.add_name(hv, n);
        }
        Some(hv)
    }

    /// Serialize all bindings as `{"bindings":[{hash, expr, type?, names}...]}`.
    /// Returns "" if serialization fails (unwrap_or_default).
    fn list_json(&self) -> String {
        #[derive(serde::Serialize)]
        struct BindingInfo {
            hash: String,
            expr: String,
            #[serde(skip_serializing_if = "Option::is_none")]
            r#type: Option,
            names: Vec,
        }
        #[derive(serde::Serialize)]
        struct BindingsList {
            bindings: Vec,
        }
        let bindings: Vec = self
            .entries
            .values()
            .map(|e| BindingInfo {
                hash: format!("{:016x}", e.hash),
                expr: e.expr.clone(),
                r#type: e.type_sig.clone(),
                names: e.names.clone(),
            })
            .collect();
        serde_json::to_string(&BindingsList { bindings }).unwrap_or_default()
    }

    /// Remove a name alias. The underlying entry (and its artifacts) are kept
    /// even when the last name is removed. Returns false if the name is unknown.
    fn unbind(&mut self, name: &str) -> bool {
        let hash = match self.name_index.remove(name) {
            Some(h) => h,
            None => return false,
        };
        if let Some(entry) = self.entries.get_mut(&hash) {
            entry.names.retain(|n| n != name);
        }
        true
    }
}

// -- C-exported binding store functions ---------------------------------------

/// C entry point: allocate a BindingStore rooted at `base_dir` and return it
/// as an opaque pointer.
///
/// # Safety
/// `base_dir` must be a valid NUL-terminated C string.
#[no_mangle]
pub unsafe extern "C" fn binding_store_init(base_dir: *const c_char) -> *mut c_void {
    let dir = CStr::from_ptr(base_dir).to_string_lossy().into_owned();
    let store = Box::new(BindingStore::new(&dir));
    Box::into_raw(store) as *mut c_void
}

/// C entry point: free a store previously returned by binding_store_init.
/// Null is accepted and ignored.
#[no_mangle]
pub unsafe extern "C" fn binding_store_free(store: *mut c_void) {
    if !store.is_null() {
        drop(Box::from_raw(store as *mut BindingStore));
    }
}

// -- Request parsing (serde_json) ---------------------------------------------

/// Wire shape of an incoming daemon request; every field is optional so that
/// method-specific fields can be absent.
#[derive(serde::Deserialize)]
struct JsonRequest {
    id: Option,
    method: Option,
    command: Option,
    args: Option,
    expr: Option,
    name: Option,
}

/// Parse `len` bytes of JSON into a C-allocated DaemonRequest.
///
/// All string fields in the result are libc-strdup'd so the C side can free
/// them uniformly; the struct itself is calloc'd (so unset fields are zeroed).
/// On any error, sets `*errmsg` and returns null. An unknown `method` frees
/// the partially-built request before returning.
///
/// # Safety
/// `json` must point to at least `len` readable bytes; `errmsg` must be null
/// or a valid out-pointer.
#[no_mangle]
pub unsafe extern "C" fn daemon_parse_request(
    json: *const c_char,
    len: usize,
    errmsg: *mut *mut c_char,
) -> *mut DaemonRequest {
    clear_errmsg(errmsg);
    let slice = std::slice::from_raw_parts(json as *const u8, len);
    let text = match std::str::from_utf8(slice) {
        Ok(s) => s,
        Err(_) => {
            set_errmsg(errmsg, &MorlocError::Other("Invalid UTF-8 in request".into()));
            return ptr::null_mut();
        }
    };
    let parsed: JsonRequest = match serde_json::from_str(text) {
        Ok(r) => r,
        Err(e) => {
            set_errmsg(
                errmsg,
                &MorlocError::Other(format!("Failed to parse request JSON: {}", e)),
            );
            return ptr::null_mut();
        }
    };
    // NOTE(review): the turbofish argument was stripped by extraction —
    // presumably size_of::<DaemonRequest>() originally.
    let req = libc::calloc(1, std::mem::size_of::()) as *mut DaemonRequest;
    if req.is_null() {
        set_errmsg(
            errmsg,
            &MorlocError::Other("Failed to allocate daemon_request_t".into()),
        );
        return ptr::null_mut();
    }
    if let Some(id) = &parsed.id {
        let c = CString::new(id.as_str()).unwrap_or_default();
        (*req).id = libc::strdup(c.as_ptr());
    }
    if let Some(method) = &parsed.method {
        // Map the method string onto the DaemonMethod enum; reject unknowns.
        (*req).method = match method.as_str() {
            "call" => DaemonMethod::Call,
            "discover" => DaemonMethod::Discover,
            "health" => DaemonMethod::Health,
            "eval" => DaemonMethod::Eval,
            "typecheck" => DaemonMethod::Typecheck,
            "bind" => DaemonMethod::Bind,
            "bindings" => DaemonMethod::Bindings,
            "unbind" => DaemonMethod::Unbind,
            _ => {
                daemon_free_request(req);
                set_errmsg(
                    errmsg,
                    &MorlocError::Other(format!("Unknown method: {}", method)),
                );
                return ptr::null_mut();
            }
        };
    }
    if let Some(cmd) = &parsed.command {
        let c = CString::new(cmd.as_str()).unwrap_or_default();
        (*req).command = libc::strdup(c.as_ptr());
    }
    if let Some(args) = &parsed.args {
        // args is kept as a re-serialized JSON string; daemon_dispatch parses
        // it again when handling "call".
        let args_str = serde_json::to_string(args).unwrap_or_default();
        let c = CString::new(args_str).unwrap_or_default();
        (*req).args_json = libc::strdup(c.as_ptr());
    }
    if let Some(expr) = &parsed.expr {
        let c = CString::new(expr.as_str()).unwrap_or_default();
        (*req).expr = libc::strdup(c.as_ptr());
    }
    if let Some(name) = &parsed.name {
        let c = CString::new(name.as_str()).unwrap_or_default();
        (*req).name = libc::strdup(c.as_ptr());
    }
    req
}

// -- Response parsing (serde_json)
// -----------------------------------------------------------------------------

/// Wire shape of a pool/daemon JSON response; all fields optional.
#[derive(serde::Deserialize)]
struct JsonResponse {
    id: Option,
    status: Option,
    result: Option,
    error: Option,
}

/// Parse `len` bytes of JSON into a C-allocated DaemonResponse.
///
/// `success` is true only when `status == "ok"`; `result` is re-serialized to
/// a JSON string. All strings are libc-strdup'd, the struct is calloc'd.
/// On error sets `*errmsg` and returns null.
///
/// # Safety
/// `json` must point to at least `len` readable bytes; `errmsg` must be null
/// or a valid out-pointer.
#[no_mangle]
pub unsafe extern "C" fn daemon_parse_response(
    json: *const c_char,
    len: usize,
    errmsg: *mut *mut c_char,
) -> *mut DaemonResponse {
    clear_errmsg(errmsg);
    let slice = std::slice::from_raw_parts(json as *const u8, len);
    let text = match std::str::from_utf8(slice) {
        Ok(s) => s,
        Err(_) => {
            set_errmsg(errmsg, &MorlocError::Other("Invalid UTF-8 in response".into()));
            return ptr::null_mut();
        }
    };
    let parsed: JsonResponse = match serde_json::from_str(text) {
        Ok(r) => r,
        Err(e) => {
            set_errmsg(
                errmsg,
                &MorlocError::Other(format!("Failed to parse response JSON: {}", e)),
            );
            return ptr::null_mut();
        }
    };
    // NOTE(review): turbofish argument stripped by extraction — presumably
    // size_of::<DaemonResponse>() originally.
    let resp = libc::calloc(1, std::mem::size_of::()) as *mut DaemonResponse;
    if resp.is_null() {
        set_errmsg(
            errmsg,
            &MorlocError::Other("Failed to allocate daemon_response_t".into()),
        );
        return ptr::null_mut();
    }
    if let Some(id) = &parsed.id {
        let c = CString::new(id.as_str()).unwrap_or_default();
        (*resp).id = libc::strdup(c.as_ptr());
    }
    // success <=> status field present and exactly "ok".
    (*resp).success = parsed
        .status
        .as_deref()
        .map(|s| s == "ok")
        .unwrap_or(false);
    if let Some(result) = &parsed.result {
        let s = serde_json::to_string(result).unwrap_or_default();
        let c = CString::new(s).unwrap_or_default();
        (*resp).result_json = libc::strdup(c.as_ptr());
    }
    if let Some(error) = &parsed.error {
        let c = CString::new(error.as_str()).unwrap_or_default();
        (*resp).error = libc::strdup(c.as_ptr());
    }
    resp
}

// -- Free functions -----------------------------------------------------------

/// Free a DaemonRequest and every strdup'd field. Null is accepted.
///
/// # Safety
/// `req` must be null or a pointer returned by daemon_parse_request.
#[no_mangle]
pub unsafe extern "C" fn daemon_free_request(req: *mut DaemonRequest) {
    if req.is_null() {
        return;
    }
    if !(*req).id.is_null() {
        libc::free((*req).id as *mut c_void);
    }
    if !(*req).command.is_null() {
        libc::free((*req).command as *mut c_void);
    }
    if !(*req).args_json.is_null() {
        libc::free((*req).args_json as *mut c_void);
    }
    if !(*req).expr.is_null() {
        libc::free((*req).expr as *mut c_void);
    }
    if !(*req).name.is_null() {
        libc::free((*req).name as *mut c_void);
    }
    libc::free(req as *mut c_void);
}

/// Free a DaemonResponse and every strdup'd field. Null is accepted.
///
/// # Safety
/// `resp` must be null or a pointer produced by this module's response
/// constructors (daemon_parse_response, daemon_dispatch, fork_morloc_command).
#[no_mangle]
pub unsafe extern "C" fn daemon_free_response(resp: *mut DaemonResponse) {
    if resp.is_null() {
        return;
    }
    if !(*resp).id.is_null() {
        libc::free((*resp).id as *mut c_void);
    }
    if !(*resp).result_json.is_null() {
        libc::free((*resp).result_json as *mut c_void);
    }
    if !(*resp).error.is_null() {
        libc::free((*resp).error as *mut c_void);
    }
    libc::free(resp as *mut c_void);
}

// -- Response serialization (serde_json) --------------------------------------

/// Serialize a DaemonResponse to a JSON object string (`id?`, `status`,
/// `result?` on success, `error?` on failure). Writes the byte length to
/// `out_len` if non-null. Returns a libc-strdup'd string owned by the caller.
///
/// # Safety
/// `response` must be a valid DaemonResponse pointer; `out_len` null or valid.
#[no_mangle]
pub unsafe extern "C" fn daemon_serialize_response(
    response: *mut DaemonResponse,
    out_len: *mut usize,
) -> *mut c_char {
    let mut map = serde_json::Map::new();
    if !(*response).id.is_null() {
        let id = CStr::from_ptr((*response).id).to_string_lossy();
        map.insert("id".into(), serde_json::Value::String(id.into_owned()));
    }
    map.insert(
        "status".into(),
        serde_json::Value::String(
            if (*response).success { "ok" } else { "error" }.into(),
        ),
    );
    if (*response).success && !(*response).result_json.is_null() {
        let raw = CStr::from_ptr((*response).result_json).to_string_lossy();
        // Try to parse as JSON value; if it fails, store as raw string
        match serde_json::from_str::(&raw) {
            Ok(v) => {
                map.insert("result".into(), v);
            }
            Err(_) => {
                map.insert("result".into(), serde_json::Value::String(raw.into_owned()));
            }
        }
    }
    if !(*response).success && !(*response).error.is_null() {
        let err = CStr::from_ptr((*response).error).to_string_lossy();
        map.insert("error".into(), serde_json::Value::String(err.into_owned()));
    }
    let json_str = serde_json::to_string(&map).unwrap_or_else(|_| "{}".into());
    if !out_len.is_null() {
        *out_len = json_str.len();
    }
    let c = CString::new(json_str).unwrap_or_default();
    libc::strdup(c.as_ptr())
}

// -- Discovery ----------------------------------------------------------------

/// Build the discovery JSON for a manifest by delegating to the C ABI symbol
/// `manifest_to_discovery_json` (ported in manifest_ffi). Caller owns the
/// returned C string.
///
/// # Safety
/// `manifest` must be a valid manifest pointer accepted by that symbol.
#[no_mangle]
pub unsafe extern "C" fn daemon_build_discovery(manifest: *mut c_void) -> *mut c_char {
    extern "C" {
        fn manifest_to_discovery_json(manifest: *const c_void) -> *mut c_char;
    }
    manifest_to_discovery_json(manifest)
}

// -- Eval timeout -------------------------------------------------------------

/// Set the global eval timeout (seconds). Non-positive values reset to the
/// default of 30 seconds.
#[no_mangle]
pub extern "C" fn daemon_set_eval_timeout(timeout_sec: i32) {
    let t = if timeout_sec > 0 { timeout_sec } else { 30 };
    G_EVAL_TIMEOUT.store(t, Ordering::Relaxed);
}

// -- Fork-based eval/typecheck ------------------------------------------------

/// Fork `morloc `, capture stdout/stderr, return a DaemonResponse.
///
/// On exit code 0: success, with stdout (trailing newlines trimmed) as
/// `result_json`. Otherwise: failure, with stderr as the error message, or a
/// signal/exit-code description if stderr is empty. The child is subject to
/// the global eval timeout via RLIMIT_CPU plus a 2 GiB RLIMIT_AS cap.
/// The returned response is calloc'd and owned by the caller.
unsafe fn fork_morloc_command(subcmd: &str, expr: *const c_char) -> *mut DaemonResponse {
    // NOTE(review): turbofish argument stripped — presumably
    // size_of::<DaemonResponse>() originally.
    let resp = libc::calloc(1, std::mem::size_of::()) as *mut DaemonResponse;
    let mut stdout_pipe = [0i32; 2];
    let mut stderr_pipe = [0i32; 2];
    if libc::pipe(stdout_pipe.as_mut_ptr()) != 0 || libc::pipe(stderr_pipe.as_mut_ptr()) != 0 {
        (*resp).success = false;
        let c = CString::new(format!("Failed to create pipes for {}", subcmd)).unwrap_or_default();
        (*resp).error = libc::strdup(c.as_ptr());
        return resp;
    }
    let pid = libc::fork();
    if pid < 0 {
        (*resp).success = false;
        let c = CString::new(format!("Failed to fork for {}", subcmd)).unwrap_or_default();
        (*resp).error = libc::strdup(c.as_ptr());
        libc::close(stdout_pipe[0]);
        libc::close(stdout_pipe[1]);
        libc::close(stderr_pipe[0]);
        libc::close(stderr_pipe[1]);
        return resp;
    }
    if pid == 0 {
        // Child: redirect stdout/stderr into the pipes, apply limits, exec.
        libc::close(stdout_pipe[0]);
        libc::close(stderr_pipe[0]);
        libc::dup2(stdout_pipe[1], libc::STDOUT_FILENO);
        libc::dup2(stderr_pipe[1], libc::STDERR_FILENO);
        libc::close(stdout_pipe[1]);
        libc::close(stderr_pipe[1]);
        let timeout = G_EVAL_TIMEOUT.load(Ordering::Relaxed);
        if timeout > 0 {
            // Soft CPU limit at timeout, hard at timeout+5 (SIGXCPU then SIGKILL).
            let cpu_limit = libc::rlimit {
                rlim_cur: timeout as libc::rlim_t,
                rlim_max: (timeout + 5) as libc::rlim_t,
            };
            libc::setrlimit(libc::RLIMIT_CPU, &cpu_limit);
            let as_limit = libc::rlimit {
                rlim_cur: 2 * 1024 * 1024 * 1024,
                rlim_max: 2 * 1024 * 1024 * 1024,
            };
            libc::setrlimit(libc::RLIMIT_AS, &as_limit);
        }
        let cmd = CString::new("morloc").unwrap();
        let arg_subcmd = CString::new(subcmd).unwrap();
        libc::execlp(
            cmd.as_ptr(),
            cmd.as_ptr(),
            arg_subcmd.as_ptr(),
            expr,
            ptr::null::(),
        );
        libc::_exit(127);
    }
    // Parent: close write-ends, drain both pipes fully, then reap the child.
    libc::close(stdout_pipe[1]);
    libc::close(stderr_pipe[1]);
    let stdout_buf = read_fd_to_vec(stdout_pipe[0]);
    libc::close(stdout_pipe[0]);
    let stderr_buf = read_fd_to_vec(stderr_pipe[0]);
    libc::close(stderr_pipe[0]);
    let mut status: i32 = 0;
    libc::waitpid(pid, &mut status, 0);
    if libc::WIFEXITED(status) && libc::WEXITSTATUS(status) == 0 {
        let mut out = String::from_utf8_lossy(&stdout_buf).into_owned();
        // Trim trailing newlines
        while out.ends_with('\n') || out.ends_with('\r') {
            out.pop();
        }
        (*resp).success = true;
        let c = CString::new(out).unwrap_or_default();
        (*resp).result_json = libc::strdup(c.as_ptr());
    } else {
        (*resp).success = false;
        // Prefer the child's stderr; otherwise describe signal/exit status.
        let errmsg = if !stderr_buf.is_empty() {
            String::from_utf8_lossy(&stderr_buf).into_owned()
        } else if libc::WIFSIGNALED(status) {
            format!("morloc {} killed by signal {}", subcmd, libc::WTERMSIG(status))
        } else {
            let code = if libc::WIFEXITED(status) {
                libc::WEXITSTATUS(status)
            } else {
                -1
            };
            format!("morloc {} exited with code {}", subcmd, code)
        };
        let c = CString::new(errmsg).unwrap_or_default();
        (*resp).error = libc::strdup(c.as_ptr());
    }
    resp
}

/// Read an fd to completion into a Vec.
/// Drain `fd` to EOF (or first error) in 8 KiB chunks.
/// NOTE(review): return type reads `Vec` — angle brackets stripped by
/// extraction; presumably `Vec<u8>` originally.
unsafe fn read_fd_to_vec(fd: i32) -> Vec {
    let mut buf = Vec::with_capacity(65536);
    let mut tmp = [0u8; 8192];
    loop {
        let n = libc::read(fd, tmp.as_mut_ptr() as *mut c_void, tmp.len());
        if n <= 0 {
            break;
        }
        buf.extend_from_slice(&tmp[..n as usize]);
    }
    buf
}

// -- Dispatch -----------------------------------------------------------------

/// Central request dispatcher: routes a parsed DaemonRequest to the handler
/// for its method and returns a caller-owned, calloc'd DaemonResponse.
///
/// Health/Discover/Eval/Typecheck/Bind/Bindings/Unbind are handled inline;
/// Call falls through to manifest lookup, argument parsing, and either pure
/// in-process evaluation (morloc_eval) or a packet round-trip to a language
/// pool over its unix socket.
///
/// # Safety
/// `manifest` must be a valid v2 Manifest pointer, `request` a valid parsed
/// request, and `sockets` an array with an entry for every pool index the
/// manifest references.
#[no_mangle]
pub unsafe extern "C" fn daemon_dispatch(
    manifest: *mut c_void,
    request: *mut DaemonRequest,
    sockets: *mut MorlocSocket,
    _shm_basename: *const c_char,
) -> *mut DaemonResponse {
    // NOTE(review): turbofish argument stripped — presumably
    // size_of::<DaemonResponse>() originally.
    let resp = libc::calloc(1, std::mem::size_of::()) as *mut DaemonResponse;
    // Echo request id
    if !(*request).id.is_null() {
        (*resp).id = libc::strdup((*request).id);
    }
    match (*request).method {
        DaemonMethod::Health => {
            // Report per-pool liveness as a JSON array of booleans (only when
            // the liveness callback was installed).
            (*resp).success = true;
            if let Some(alive_fn) = G_POOL_ALIVE_FN {
                let mut arr = Vec::with_capacity(G_N_POOLS);
                for i in 0..G_N_POOLS {
                    arr.push(serde_json::Value::Bool(alive_fn(i)));
                }
                let json = serde_json::to_string(&arr).unwrap_or_default();
                let c = CString::new(json).unwrap_or_default();
                (*resp).result_json = libc::strdup(c.as_ptr());
            }
            return resp;
        }
        DaemonMethod::Discover => {
            (*resp).success = true;
            (*resp).result_json = daemon_build_discovery(manifest);
            return resp;
        }
        DaemonMethod::Eval => {
            if (*request).expr.is_null() {
                (*resp).success = false;
                let c = CString::new("Missing 'expr' field in eval request").unwrap();
                (*resp).error = libc::strdup(c.as_ptr());
                return resp;
            }
            // Check binding store for cached expression
            if !G_BINDING_STORE.is_null() {
                let expr_str = CStr::from_ptr((*request).expr).to_string_lossy();
                let store = &*G_BINDING_STORE;
                let hv = hash::xxh64_with_seed(expr_str.as_bytes(), DEFAULT_XXHASH_SEED);
                let _cached = store
                    .lookup_hash(hv)
                    .or_else(|| store.lookup_name(&expr_str));
                // TODO: direct binary execution for bound functions
            }
            // Replace resp with the fork result, carrying the request id over.
            let eval_resp = fork_morloc_command("eval", (*request).expr);
            if !(*request).id.is_null() {
                (*eval_resp).id = libc::strdup((*request).id);
            }
            // NOTE(review): (*resp).id was strdup'd at the top of this
            // function but is not freed before resp itself is freed here —
            // this leaks the duplicated id string. Confirm and free
            // (*resp).id first (same issue in the Typecheck branch).
            libc::free(resp as *mut c_void);
            return eval_resp;
        }
        DaemonMethod::Typecheck => {
            if (*request).expr.is_null() {
                (*resp).success = false;
                let c = CString::new("Missing 'expr' field in typecheck request").unwrap();
                (*resp).error = libc::strdup(c.as_ptr());
                return resp;
            }
            let tc_resp = fork_morloc_command("typecheck", (*request).expr);
            if !(*request).id.is_null() {
                (*tc_resp).id = libc::strdup((*request).id);
            }
            // NOTE(review): same (*resp).id leak as in the Eval branch.
            libc::free(resp as *mut c_void);
            return tc_resp;
        }
        DaemonMethod::Bind => {
            if (*request).expr.is_null() {
                (*resp).success = false;
                let c = CString::new("Missing 'expr' field in bind request").unwrap();
                (*resp).error = libc::strdup(c.as_ptr());
                return resp;
            }
            if G_BINDING_STORE.is_null() {
                (*resp).success = false;
                let c = CString::new("Binding store not initialized").unwrap();
                (*resp).error = libc::strdup(c.as_ptr());
                return resp;
            }
            let store = &mut *G_BINDING_STORE;
            let expr_str = CStr::from_ptr((*request).expr).to_string_lossy().into_owned();
            let name = if (*request).name.is_null() {
                None
            } else {
                Some(CStr::from_ptr((*request).name).to_string_lossy().into_owned())
            };
            let timeout = G_EVAL_TIMEOUT.load(Ordering::Relaxed);
            match store.bind(&expr_str, name.as_deref(), timeout) {
                Some(hv) => {
                    // Success: return {hash, expr, name?, type?}.
                    let mut map = serde_json::Map::new();
                    map.insert(
                        "hash".into(),
                        serde_json::Value::String(format!("{:016x}", hv)),
                    );
                    map.insert("expr".into(), serde_json::Value::String(expr_str));
                    if let Some(n) = &name {
                        map.insert("name".into(), serde_json::Value::String(n.clone()));
                    }
                    if let Some(entry) = store.lookup_hash(hv) {
                        if let Some(ref ts) = entry.type_sig {
                            map.insert("type".into(), serde_json::Value::String(ts.clone()));
                        }
                    }
                    let json = serde_json::to_string(&map).unwrap_or_default();
                    (*resp).success = true;
                    let c = CString::new(json).unwrap_or_default();
                    (*resp).result_json = libc::strdup(c.as_ptr());
                }
                None => {
                    (*resp).success = false;
                    let c = CString::new("Failed to compile and bind expression").unwrap_or_default();
                    (*resp).error = libc::strdup(c.as_ptr());
                }
            }
            return resp;
        }
        DaemonMethod::Bindings => {
            // Always succeeds; empty list if the store is uninitialized.
            (*resp).success = true;
            if G_BINDING_STORE.is_null() {
                let c = CString::new("{\"bindings\":[]}").unwrap();
                (*resp).result_json = libc::strdup(c.as_ptr());
            } else {
                let store = &*G_BINDING_STORE;
                let json = store.list_json();
                let c = CString::new(json).unwrap_or_default();
                (*resp).result_json = libc::strdup(c.as_ptr());
            }
            return resp;
        }
        DaemonMethod::Unbind => {
            // Accept the binding name from either 'command' or 'name'.
            let name_ptr = if !(*request).command.is_null() {
                (*request).command
            } else {
                (*request).name
            };
            if name_ptr.is_null() {
                (*resp).success = false;
                let c = CString::new("Missing binding name").unwrap();
                (*resp).error = libc::strdup(c.as_ptr());
                return resp;
            }
            if G_BINDING_STORE.is_null() {
                (*resp).success = false;
                let c = CString::new("Binding store not initialized").unwrap();
                (*resp).error = libc::strdup(c.as_ptr());
                return resp;
            }
            let store = &mut *G_BINDING_STORE;
            let name = CStr::from_ptr(name_ptr).to_string_lossy();
            if store.unbind(&name) {
                (*resp).success = true;
                let c = CString::new("{\"removed\":true}").unwrap();
                (*resp).result_json = libc::strdup(c.as_ptr());
            } else {
                (*resp).success = false;
                let c = CString::new(format!("Binding not found: {}", name)).unwrap_or_default();
                (*resp).error = libc::strdup(c.as_ptr());
            }
            return resp;
        }
        DaemonMethod::Call => {
            // Fall through to call dispatch below
        }
    }
    // DAEMON_CALL
    if (*request).command.is_null() {
        (*resp).success = false;
        let c = CString::new("Missing 'command' field in call request").unwrap();
        (*resp).error = libc::strdup(c.as_ptr());
        return resp;
    }
    // Delegate to the C functions that handle manifest lookup, arg parsing,
    // schema handling, and pool communication. These are all already ported
    // to Rust in other _ffi modules, so we declare them as extern "C".
    extern "C" {
        fn parse_schema(schema: *const c_char, errmsg: *mut *mut c_char) -> *mut CSchema;
        fn free_schema(schema: *mut CSchema);
        fn initialize_positional(value: *mut c_char) -> *mut c_void;
        fn free_argument_t(arg: *mut c_void);
        fn parse_cli_data_argument(
            dest: *mut u8,
            arg: *const c_void,
            schema: *const CSchema,
            errmsg: *mut *mut c_char,
        ) -> *mut u8;
        fn make_call_packet_from_cli(
            dest: *mut u8,
            mid: u32,
            args: *mut *mut c_void,
            arg_schema_strs: *mut *mut c_char,
            errmsg: *mut *mut c_char,
        ) -> *mut u8;
        fn send_and_receive_over_socket(
            socket_path: *const c_char,
            packet: *const u8,
            errmsg: *mut *mut c_char,
        ) -> *mut u8;
        fn get_morloc_data_packet_error_message(
            data: *const u8,
            errmsg: *mut *mut c_char,
        ) -> *mut c_char;
        fn get_morloc_data_packet_value(
            data: *const u8,
            schema: *const CSchema,
            errmsg: *mut *mut c_char,
        ) -> *mut u8;
        fn voidstar_to_json_string(
            data: *const c_void,
            schema: *const CSchema,
            errmsg: *mut *mut c_char,
        ) -> *mut c_char;
        fn morloc_eval(
            expr: *mut c_void, // actually *mut MorlocExpression
            return_schema: *mut CSchema,
            arg_voidstar: *mut *mut u8,
            arg_schemas: *mut *mut CSchema,
            nargs: usize,
            errmsg: *mut *mut c_char,
        ) -> *mut u8;
    }
    // The manifest is the canonical v2 C struct from manifest_ffi.rs.
    // No local mirror needed -- import the real type and walk it.
    use crate::manifest_ffi::{Manifest as ManifestC, ManifestArgKind, ManifestCommand};
    let mv = manifest as *const ManifestC;
    let command_name = CStr::from_ptr((*request).command);
    // Linear scan of the manifest command table for a name match.
    let mut cmd: *const ManifestCommand = ptr::null();
    for i in 0..(*mv).n_commands {
        let c = &*(*mv).commands.add(i);
        if CStr::from_ptr(c.name) == command_name {
            cmd = c;
            break;
        }
    }
    if cmd.is_null() {
        (*resp).success = false;
        let msg = format!(
            "Unknown command: {}",
            command_name.to_string_lossy()
        );
        let c = CString::new(msg).unwrap_or_default();
        (*resp).error = libc::strdup(c.as_ptr());
        return resp;
    }
    let cmd = &*cmd;
    let expected_nargs = cmd.n_args;
    // Parse JSON args into argument_t** array
    let mut err: *mut c_char = ptr::null_mut();
    let args: *mut *mut c_void;
    if !(*request).args_json.is_null() {
        // Parse the JSON array
        // NOTE(review): `Vec` element type stripped by extraction —
        // presumably Vec<serde_json::Value> originally.
        let args_str = CStr::from_ptr((*request).args_json).to_string_lossy();
        let parsed_args: Vec = match serde_json::from_str(&args_str) {
            Ok(v) => v,
            Err(e) => {
                (*resp).success = false;
                let c = CString::new(format!("Failed to parse args: {}", e)).unwrap_or_default();
                (*resp).error = libc::strdup(c.as_ptr());
                return resp;
            }
        };
        if parsed_args.len() != expected_nargs {
            (*resp).success = false;
            let c = CString::new(format!(
                "Expected {} arguments, got {}",
                expected_nargs,
                parsed_args.len()
            ))
            .unwrap_or_default();
            (*resp).error = libc::strdup(c.as_ptr());
            return resp;
        }
        // NULL-terminated argument_t* array (hence +1).
        args = libc::calloc(expected_nargs + 1, std::mem::size_of::<*mut c_void>())
            as *mut *mut c_void;
        for (i, val) in parsed_args.iter().enumerate() {
            // Strings are re-quoted so initialize_positional sees valid JSON.
            let val_str = match val {
                serde_json::Value::String(s) => format!("\"{}\"", s),
                other => other.to_string(),
            };
            let c = CString::new(val_str).unwrap_or_default();
            let dup = libc::strdup(c.as_ptr());
            *args.add(i) = initialize_positional(dup);
            libc::free(dup as *mut c_void);
        }
        *args.add(expected_nargs) = ptr::null_mut();
    } else {
        if expected_nargs > 0 {
            // Check if any are positional (required)
            // For simplicity, match the C behavior: require args if n_args > 0
            (*resp).success = false;
            let c = CString::new("Missing 'args' field in call request").unwrap();
            (*resp).error = libc::strdup(c.as_ptr());
            return resp;
        }
        // Zero-arg call: a single NULL terminator.
        args = libc::calloc(1, std::mem::size_of::<*mut c_void>()) as *mut *mut c_void;
        *args = ptr::null_mut();
    }
    if cmd.is_pure {
        // Pure command: evaluate expression tree
        let mut nargs: usize = 0;
        while !(*args.add(nargs)).is_null() {
            nargs += 1;
        }
        // v2: schemas live on each ManifestArg. Walk cmd.args in
        // declaration order, INCLUDING flags (they consume an arg
        // slot in the parsed list and need a corresponding schema
        // entry to keep alignment). For flags, fall back to the
        // boolean schema "b".
        static FLAG_SCHEMA: &[u8] = b"b\0";
        let mut arg_schema_strs: Vec<*mut c_char> = Vec::with_capacity(nargs);
        for i in 0..cmd.n_args {
            let a = &*cmd.args.add(i);
            let s = if a.kind == ManifestArgKind::Flag || a.schema.is_null() {
                FLAG_SCHEMA.as_ptr() as *mut c_char
            } else {
                a.schema
            };
            arg_schema_strs.push(s);
        }
        // Per-argument parallel arrays: parsed schema, data packet, voidstar.
        let arg_schemas_arr =
            libc::calloc(nargs, std::mem::size_of::<*mut CSchema>()) as *mut *mut CSchema;
        let arg_packets = libc::calloc(nargs, std::mem::size_of::<*mut u8>()) as *mut *mut u8;
        let arg_voidstars = libc::calloc(nargs, std::mem::size_of::<*mut u8>()) as *mut *mut u8;
        let mut cleanup_and_fail = false;
        for i in 0..nargs {
            let schema_str = arg_schema_strs.get(i).copied().unwrap_or(ptr::null_mut());
            *arg_schemas_arr.add(i) = parse_schema(schema_str, &mut err);
            if !err.is_null() {
                (*resp).success = false;
                (*resp).error = err;
                cleanup_and_fail = true;
                break;
            }
            *arg_packets.add(i) = parse_cli_data_argument(
                ptr::null_mut(),
                *args.add(i),
                *arg_schemas_arr.add(i),
                &mut err,
            );
            if !err.is_null() {
                (*resp).success = false;
                (*resp).error = err;
                cleanup_and_fail = true;
                break;
            }
            *arg_voidstars.add(i) = get_morloc_data_packet_value(
                *arg_packets.add(i),
                *arg_schemas_arr.add(i),
                &mut err,
            );
            if !err.is_null() {
                (*resp).success = false;
                (*resp).error = err;
                cleanup_and_fail = true;
                break;
            }
        }
        if !cleanup_and_fail {
            let return_schema = parse_schema(cmd.ret.schema, &mut err);
            if !err.is_null() {
                (*resp).success = false;
                (*resp).error = err;
            } else {
                let result_abs = morloc_eval(
                    cmd.expr as *mut c_void,
                    return_schema,
                    arg_voidstars,
                    arg_schemas_arr,
                    nargs,
                    &mut err,
                );
                if !err.is_null() {
                    (*resp).success = false;
                    (*resp).error = err;
                } else {
                    let json = voidstar_to_json_string(
                        result_abs as *const c_void,
                        return_schema as *const CSchema,
                        &mut err,
                    );
                    if !err.is_null() {
                        (*resp).success = false;
                        (*resp).error = err;
                    } else {
                        (*resp).success = true;
                        (*resp).result_json = json;
                    }
                }
                free_schema(return_schema);
            }
        }
        // Cleanup
        // Free per-argument schemas and packets; the voidstar pointers are
        // views into the packets, so only their holder array is freed.
        for i in 0..nargs {
            let s = *arg_schemas_arr.add(i);
            if !s.is_null() {
                free_schema(s);
            }
            let p = *arg_packets.add(i);
            if !p.is_null() {
                libc::free(p as *mut c_void);
            }
        }
        libc::free(arg_schemas_arr as *mut c_void);
        libc::free(arg_packets as *mut c_void);
        libc::free(arg_voidstars as *mut c_void);
    } else {
        // Remote command: send call packet to pool. v2 stores schemas
        // per-arg, but make_call_packet_from_cli wants a NULL-terminated
        // flat array. ManifestCommand exposes a helper that materializes
        // the flat view; the outer pointer array is owned by us and
        // freed below, but the inner C strings remain owned by the
        // ManifestArg objects.
        let arg_schemas_flat = cmd.build_arg_schemas_array();
        let call_packet = make_call_packet_from_cli(
            ptr::null_mut(),
            cmd.mid,
            args,
            arg_schemas_flat,
            &mut err,
        );
        libc::free(arg_schemas_flat as *mut c_void);
        if !err.is_null() {
            (*resp).success = false;
            (*resp).error = err;
        } else {
            // Round-trip the packet through the pool's unix socket.
            let socket_path = (*sockets.add(cmd.pool_index)).socket_filename;
            let result_packet = send_and_receive_over_socket(socket_path, call_packet, &mut err);
            libc::free(call_packet as *mut c_void);
            if !err.is_null() {
                (*resp).success = false;
                (*resp).error = err;
            } else {
                // A packet may carry an application-level error message.
                let packet_error = get_morloc_data_packet_error_message(result_packet, &mut err);
                if !packet_error.is_null() {
                    (*resp).success = false;
                    (*resp).error = libc::strdup(packet_error);
                    libc::free(result_packet as *mut c_void);
                } else if !err.is_null() {
                    (*resp).success = false;
                    (*resp).error = err;
                    libc::free(result_packet as *mut c_void);
                } else {
                    let return_schema = parse_schema(cmd.ret.schema, &mut err);
                    if !err.is_null() {
                        (*resp).success = false;
                        (*resp).error = err;
                        libc::free(result_packet as *mut c_void);
                    } else {
                        let packet_value = get_morloc_data_packet_value(
                            result_packet,
                            return_schema as *const CSchema,
                            &mut err,
                        );
                        if !err.is_null() {
                            (*resp).success = false;
                            (*resp).error = err;
                        } else {
                            let json = voidstar_to_json_string(
                                packet_value as *const c_void,
                                return_schema as *const CSchema,
                                &mut err,
                            );
                            if !err.is_null() {
                                (*resp).success = false;
                                (*resp).error = err;
                            } else {
                                (*resp).success = true;
                                (*resp).result_json = json;
                            }
                        }
                        free_schema(return_schema);
                        libc::free(result_packet as *mut c_void);
                    }
                }
            }
        }
    }
    // Free args
    let mut i = 0;
    while !(*args.add(i)).is_null() {
        free_argument_t(*args.add(i));
        i += 1;
    }
    libc::free(args as *mut c_void);
    resp
}

// -- Length-prefixed message protocol -----------------------------------------

/// Read one length-prefixed message from `fd`: a 4-byte big-endian length
/// (capped at MAX_LP_MESSAGE) followed by the body. Returns a malloc'd,
/// NUL-terminated buffer owned by the caller and writes the body length to
/// `out_len` if non-null; on failure sets `*errmsg` and returns null.
unsafe fn read_lp_message(
    fd: i32,
    out_len: *mut usize,
    errmsg: *mut *mut c_char,
) -> *mut c_char {
    clear_errmsg(errmsg);
    let mut len_buf = [0u8; 4];
    // MSG_WAITALL: block until all 4 prefix bytes arrive (or error/EOF).
    let n = libc::recv(
        fd,
        len_buf.as_mut_ptr() as *mut c_void,
        4,
        libc::MSG_WAITALL,
    );
    if n != 4 {
        set_errmsg(
            errmsg,
            &MorlocError::Other("Failed to read message length prefix".into()),
        );
        return ptr::null_mut();
    }
    // Big-endian (network byte order) length.
    let msg_len = ((len_buf[0] as u32) << 24)
        | ((len_buf[1] as u32) << 16)
        | ((len_buf[2] as u32) << 8)
        | (len_buf[3] as u32);
    if msg_len > MAX_LP_MESSAGE {
        set_errmsg(
            errmsg,
            &MorlocError::Other(format!("Message too large: {} bytes", msg_len)),
        );
        return ptr::null_mut();
    }
    // +1 for the trailing NUL added below.
    let msg = libc::malloc(msg_len as usize + 1) as *mut c_char;
    if msg.is_null() {
        set_errmsg(
            errmsg,
            &MorlocError::Other("Failed to allocate message buffer".into()),
        );
        return ptr::null_mut();
    }
    let mut total: usize = 0;
    while total < msg_len as usize {
        let n = libc::recv(
            fd,
            msg.add(total) as *mut c_void,
            msg_len as usize - total,
            0,
        );
        if n <= 0 {
            libc::free(msg as *mut c_void);
            set_errmsg(
                errmsg,
                &MorlocError::Other(format!(
                    "Failed to read message body (got {} of {} bytes)",
                    total, msg_len
                )),
            );
            return ptr::null_mut();
        }
        total += n as usize;
    }
    *msg.add(msg_len as usize) = 0;
    if !out_len.is_null() {
        *out_len = msg_len as usize;
    }
    msg
}

/// Write one length-prefixed message to `fd`: a 4-byte big-endian length then
/// `len` bytes of `data`. Returns false (with `*errmsg` set) on any short or
/// failed send. Sends use SEND_NOSIGNAL so a closed peer yields an error
/// instead of SIGPIPE.
/// NOTE(review): `len` is a usize but the wire prefix is 32-bit; values above
/// u32::MAX would be silently truncated — confirm callers never exceed
/// MAX_LP_MESSAGE.
unsafe fn write_lp_message(
    fd: i32,
    data: *const c_char,
    len: usize,
    errmsg: *mut *mut c_char,
) -> bool {
    clear_errmsg(errmsg);
    let len_buf: [u8; 4] = [
        ((len >> 24) & 0xFF) as u8,
        ((len >> 16) & 0xFF) as u8,
        ((len >> 8) & 0xFF) as u8,
        (len & 0xFF) as u8,
    ];
    let n = libc::send(
        fd,
        len_buf.as_ptr() as *const c_void,
        4,
        crate::utility::SEND_NOSIGNAL,
    );
    if n != 4 {
        set_errmsg(
            errmsg,
            &MorlocError::Other("Failed to write message length prefix".into()),
        );
        return false;
    }
    let mut total: usize = 0;
    while total < len {
        let n = libc::send(
            fd,
            (data as *const u8).add(total) as *const c_void,
            len - total,
            crate::utility::SEND_NOSIGNAL,
        );
        if n <= 0 {
            set_errmsg(
                errmsg,
                &MorlocError::Other("Failed to write message body".into()),
            );
            return false;
        }
        total += n as usize;
    }
    true
}

// -- Connection handlers ------------------------------------------------------

unsafe fn
handle_lp_connection( client_fd: i32, manifest: *mut c_void, sockets: *mut MorlocSocket, shm_basename: *const c_char, ) { let mut errmsg: *mut c_char = ptr::null_mut(); let mut msg_len: usize = 0; // Peek to distinguish a probe connection (immediate EOF) from a real // client. The router's readiness check connects then closes without // sending data; silently ignore those. let mut peek_buf = [0u8; 1]; let peek_n = libc::recv(client_fd, peek_buf.as_mut_ptr() as *mut c_void, 1, libc::MSG_PEEK); if peek_n == 0 { // Clean EOF — probe connection, silently close. libc::close(client_fd); return; } let msg = read_lp_message(client_fd, &mut msg_len, &mut errmsg); if !errmsg.is_null() { let err_str = CStr::from_ptr(errmsg).to_string_lossy(); eprintln!("daemon: read error: {}", err_str); libc::free(errmsg as *mut c_void); libc::close(client_fd); return; } let req = daemon_parse_request(msg, msg_len, &mut errmsg); libc::free(msg as *mut c_void); if !errmsg.is_null() { let mut err_resp: DaemonResponse = std::mem::zeroed(); err_resp.success = false; err_resp.error = errmsg; let mut resp_len: usize = 0; let resp_json = daemon_serialize_response(&mut err_resp, &mut resp_len); let mut write_err: *mut c_char = ptr::null_mut(); write_lp_message(client_fd, resp_json, resp_len, &mut write_err); libc::free(resp_json as *mut c_void); if !write_err.is_null() { libc::free(write_err as *mut c_void); } libc::free(errmsg as *mut c_void); libc::close(client_fd); return; } let resp = daemon_dispatch(manifest, req, sockets, shm_basename); let mut resp_len: usize = 0; let resp_json = daemon_serialize_response(resp, &mut resp_len); let mut write_err: *mut c_char = ptr::null_mut(); write_lp_message(client_fd, resp_json, resp_len, &mut write_err); if !write_err.is_null() { let err_str = CStr::from_ptr(write_err).to_string_lossy(); eprintln!("daemon: write error: {}", err_str); libc::free(write_err as *mut c_void); } libc::free(resp_json as *mut c_void); daemon_free_request(req); 
daemon_free_response(resp); libc::close(client_fd); } unsafe fn handle_http_connection( client_fd: i32, manifest: *mut c_void, sockets: *mut MorlocSocket, shm_basename: *const c_char, ) { extern "C" { fn http_parse_request(fd: i32, errmsg: *mut *mut c_char) -> *mut HttpRequest; fn http_free_request(req: *mut HttpRequest); fn http_write_response( fd: i32, status: i32, content_type: *const c_char, body: *const c_char, body_len: usize, ) -> bool; fn http_to_daemon_request( req: *mut HttpRequest, errmsg: *mut *mut c_char, ) -> *mut DaemonRequest; } let mut errmsg: *mut c_char = ptr::null_mut(); let http_req = http_parse_request(client_fd, &mut errmsg); if !errmsg.is_null() { let body = b"{\"status\":\"error\",\"error\":\"Bad request\"}\0"; let ct = b"application/json\0"; http_write_response( client_fd, 400, ct.as_ptr() as *const c_char, body.as_ptr() as *const c_char, body.len() - 1, ); libc::free(errmsg as *mut c_void); libc::close(client_fd); return; } let req = http_to_daemon_request(http_req, &mut errmsg); if !errmsg.is_null() { let body = b"{\"status\":\"error\",\"error\":\"Invalid request\"}\0"; let ct = b"application/json\0"; http_write_response( client_fd, 400, ct.as_ptr() as *const c_char, body.as_ptr() as *const c_char, body.len() - 1, ); http_free_request(http_req); libc::free(errmsg as *mut c_void); libc::close(client_fd); return; } http_free_request(http_req); let resp = daemon_dispatch(manifest, req, sockets, shm_basename); let mut resp_len: usize = 0; let resp_json = daemon_serialize_response(resp, &mut resp_len); // Append newline for terminal-friendly output let resp_body = libc::malloc(resp_len + 2) as *mut u8; ptr::copy_nonoverlapping(resp_json as *const u8, resp_body, resp_len); *resp_body.add(resp_len) = b'\n'; *resp_body.add(resp_len + 1) = 0; let status = if (*resp).success { 200 } else { 500 }; let ct = b"application/json\0"; http_write_response( client_fd, status, ct.as_ptr() as *const c_char, resp_body as *const c_char, resp_len + 1, ); 
libc::free(resp_body as *mut c_void); libc::free(resp_json as *mut c_void); daemon_free_request(req); daemon_free_response(resp); libc::close(client_fd); } // -- Thread pool (VecDeque + Condvar instead of linked list + pthread) -------- #[derive(Clone, Copy)] struct DaemonJob { client_fd: i32, conn_type: i32, // 0 = length-prefixed (unix/tcp), 2 = http } struct JobQueue { jobs: VecDeque, } struct WorkerContext { queue: Mutex, cond: Condvar, manifest: *mut c_void, sockets: *mut MorlocSocket, shm_basename: *const c_char, } // SAFETY: WorkerContext is shared between threads but all raw pointers // within it point to read-only or thread-safe C data. unsafe impl Send for WorkerContext {} unsafe impl Sync for WorkerContext {} fn set_socket_timeouts(fd: i32, timeout_sec: i32) { unsafe { let tv = libc::timeval { tv_sec: timeout_sec as _, tv_usec: 0, }; libc::setsockopt( fd, libc::SOL_SOCKET, libc::SO_RCVTIMEO, &tv as *const libc::timeval as *const c_void, std::mem::size_of::() as libc::socklen_t, ); libc::setsockopt( fd, libc::SOL_SOCKET, libc::SO_SNDTIMEO, &tv as *const libc::timeval as *const c_void, std::mem::size_of::() as libc::socklen_t, ); } } // -- Main daemon event loop --------------------------------------------------- const MAX_LISTENERS: usize = 3; #[no_mangle] pub unsafe extern "C" fn daemon_run( config: *mut DaemonConfig, manifest: *mut c_void, sockets: *mut MorlocSocket, n_pools: usize, shm_basename: *const c_char, ) { // Set globals G_POOL_ALIVE_FN = (*config).pool_alive_fn; G_N_POOLS = n_pools; let timeout = if (*config).eval_timeout > 0 { (*config).eval_timeout } else { 30 }; G_EVAL_TIMEOUT.store(timeout, Ordering::Relaxed); // Initialize binding store if G_BINDING_STORE.is_null() { let store = Box::new(BindingStore::new("/tmp/morloc-bindings")); G_BINDING_STORE = Box::into_raw(store); } // Install signal handlers SHUTDOWN_REQUESTED.store(false, Ordering::Relaxed); let handler: libc::sighandler_t = std::mem::transmute::(daemon_signal_handler_fn); 
libc::signal(libc::SIGTERM, handler); libc::signal(libc::SIGINT, handler); let mut fds = [libc::pollfd { fd: -1, events: 0, revents: 0, }; MAX_LISTENERS]; let mut fd_types = [0i32; MAX_LISTENERS]; // 0=unix, 1=tcp, 2=http let mut nfds: usize = 0; // Unix socket if !(*config).unix_socket_path.is_null() { let sock_fd = libc::socket(libc::AF_UNIX, libc::SOCK_STREAM, 0); if sock_fd < 0 { eprintln!("daemon: failed to create unix socket"); return; } let mut addr: libc::sockaddr_un = std::mem::zeroed(); addr.sun_family = libc::AF_UNIX as libc::sa_family_t; let path_bytes = CStr::from_ptr((*config).unix_socket_path).to_bytes(); let copy_len = path_bytes.len().min(addr.sun_path.len() - 1); ptr::copy_nonoverlapping( path_bytes.as_ptr() as *const c_char, addr.sun_path.as_mut_ptr(), copy_len, ); libc::unlink((*config).unix_socket_path); if libc::bind( sock_fd, &addr as *const libc::sockaddr_un as *const libc::sockaddr, std::mem::size_of::() as libc::socklen_t, ) < 0 { eprintln!("daemon: failed to bind unix socket"); libc::close(sock_fd); return; } libc::listen(sock_fd, 64); fds[nfds].fd = sock_fd; fds[nfds].events = libc::POLLIN as i16; fd_types[nfds] = 0; nfds += 1; } // TCP if (*config).tcp_port > 0 { let tcp_fd = libc::socket(libc::AF_INET, libc::SOCK_STREAM, 0); if tcp_fd < 0 { eprintln!("daemon: failed to create tcp socket"); return; } let opt: i32 = 1; libc::setsockopt( tcp_fd, libc::SOL_SOCKET, libc::SO_REUSEADDR, &opt as *const i32 as *const c_void, std::mem::size_of::() as libc::socklen_t, ); let mut addr: libc::sockaddr_in = std::mem::zeroed(); addr.sin_family = libc::AF_INET as libc::sa_family_t; addr.sin_addr.s_addr = u32::from_be(0x7f000001); // INADDR_LOOPBACK addr.sin_port = ((*config).tcp_port as u16).to_be(); if libc::bind( tcp_fd, &addr as *const libc::sockaddr_in as *const libc::sockaddr, std::mem::size_of::() as libc::socklen_t, ) < 0 { eprintln!( "daemon: failed to bind tcp port {}", (*config).tcp_port ); libc::close(tcp_fd); return; } libc::listen(tcp_fd, 
64); fds[nfds].fd = tcp_fd; fds[nfds].events = libc::POLLIN as i16; fd_types[nfds] = 1; nfds += 1; } // HTTP if (*config).http_port > 0 { let http_fd = libc::socket(libc::AF_INET, libc::SOCK_STREAM, 0); if http_fd < 0 { eprintln!("daemon: failed to create http socket"); return; } let opt: i32 = 1; libc::setsockopt( http_fd, libc::SOL_SOCKET, libc::SO_REUSEADDR, &opt as *const i32 as *const c_void, std::mem::size_of::() as libc::socklen_t, ); let mut addr: libc::sockaddr_in = std::mem::zeroed(); addr.sin_family = libc::AF_INET as libc::sa_family_t; // HTTP router is externally reachable; bind to all interfaces so that // container port mappings (docker -p) can reach it. addr.sin_addr.s_addr = libc::INADDR_ANY.to_be(); addr.sin_port = ((*config).http_port as u16).to_be(); if libc::bind( http_fd, &addr as *const libc::sockaddr_in as *const libc::sockaddr, std::mem::size_of::() as libc::socklen_t, ) < 0 { eprintln!( "daemon: failed to bind http port {}", (*config).http_port ); libc::close(http_fd); return; } libc::listen(http_fd, 64); fds[nfds].fd = http_fd; fds[nfds].events = libc::POLLIN as i16; fd_types[nfds] = 2; nfds += 1; } if nfds == 0 { eprintln!("daemon: no listeners configured, exiting"); return; } // Start worker thread pool let ctx = Arc::new(WorkerContext { queue: Mutex::new(JobQueue { jobs: VecDeque::new(), }), cond: Condvar::new(), manifest, sockets, shm_basename, }); let n_workers = n_pools.saturating_add(4).clamp(4, 32); let mut workers = Vec::with_capacity(n_workers); for _ in 0..n_workers { let ctx = Arc::clone(&ctx); workers.push(std::thread::spawn(move || { daemon_worker_fn(ctx); })); } // Main event loop while !SHUTDOWN_REQUESTED.load(Ordering::Relaxed) { let ready = libc::poll(fds.as_mut_ptr(), nfds as libc::nfds_t, 1000); if ready < 0 { if crate::utility::errno_val() == libc::EINTR { continue; } eprintln!("daemon: poll error"); break; } // Check and restart crashed pools if let Some(check_fn) = (*config).pool_check_fn { check_fn(sockets, 
n_pools); } if ready == 0 { continue; } for i in 0..nfds { if fds[i].revents & libc::POLLIN as i16 == 0 { continue; } let client_fd = libc::accept(fds[i].fd, ptr::null_mut(), ptr::null_mut()); if client_fd < 0 { if crate::utility::errno_val() == libc::EINTR || crate::utility::errno_val() == libc::EAGAIN { continue; } eprintln!("daemon: accept error"); continue; } crate::utility::set_nosigpipe(client_fd); set_socket_timeouts(client_fd, 30); let job = DaemonJob { client_fd, conn_type: fd_types[i], }; let mut q = ctx.queue.lock().unwrap(); q.jobs.push_back(job); ctx.cond.notify_one(); } } // Wake all workers and join ctx.cond.notify_all(); for w in workers { let _ = w.join(); } // Drain remaining jobs { let mut q = ctx.queue.lock().unwrap(); while let Some(job) = q.jobs.pop_front() { libc::close(job.client_fd); } } // Close listener sockets for i in 0..nfds { libc::close(fds[i].fd); } if !(*config).unix_socket_path.is_null() { libc::unlink((*config).unix_socket_path); } } fn daemon_worker_fn(ctx: Arc) { loop { if SHUTDOWN_REQUESTED.load(Ordering::Relaxed) { break; } let job = { let mut q = ctx.queue.lock().unwrap(); loop { if let Some(job) = q.jobs.pop_front() { break Some(job); } if SHUTDOWN_REQUESTED.load(Ordering::Relaxed) { break None; } // Wait with timeout so we recheck shutdown let (guard, _timeout) = ctx .cond .wait_timeout(q, std::time::Duration::from_millis(100)) .unwrap(); q = guard; } }; let job = match job { Some(j) => j, None => continue, }; unsafe { if job.conn_type == 2 { handle_http_connection( job.client_fd, ctx.manifest, ctx.sockets, ctx.shm_basename, ); } else { handle_lp_connection( job.client_fd, ctx.manifest, ctx.sockets, ctx.shm_basename, ); } } } } // Signal handler (must be async-signal-safe) extern "C" fn daemon_signal_handler_fn(_sig: i32) { SHUTDOWN_REQUESTED.store(true, Ordering::Relaxed); } ================================================ FILE: data/rust/morloc-runtime/src/error.rs ================================================ use 
std::ffi::{CString, c_char};

/// Unified error type for the morloc runtime FFI layer.
///
/// Rendered to a C string via `set_errmsg` when crossing the FFI boundary;
/// the `thiserror` attributes define the human-readable message for each
/// variant.
#[derive(Debug, thiserror::Error)]
pub enum MorlocError {
    #[error("shared memory error: {0}")]
    Shm(String),
    #[error("packet error: {0}")]
    Packet(String),
    #[error("schema error: {0}")]
    Schema(String),
    #[error("serialization error: {0}")]
    Serialization(String),
    #[error("IPC error: {0}")]
    Ipc(String),
    #[error("IO error: {0}")]
    Io(#[from] std::io::Error),
    #[error("null pointer")]
    NullPointer,
    #[error("{0}")]
    Other(String),
}

/// Write a MorlocError into the C ERRMSG convention.
///
/// Allocates a NUL-terminated copy of the error's display string and stores
/// it through `errmsg`. A NULL `errmsg` is a silent no-op.
///
/// NOTE(review): if the rendered message contains an interior NUL byte,
/// `CString::new` fails and `*errmsg` is left untouched — presumably still
/// NULL after `clear_errmsg`, so the caller would observe "no error" despite
/// one occurring. Confirm message sources cannot contain NULs.
///
/// # Safety
/// `errmsg` must be a valid, non-dangling pointer to a `*mut c_char` (i.e., `char**`).
/// The caller is responsible for freeing the allocated string via `CString::from_raw`
/// or `libc::free`.
pub unsafe fn set_errmsg(errmsg: *mut *mut c_char, err: &MorlocError) {
    if !errmsg.is_null() {
        if let Ok(cstr) = CString::new(err.to_string()) {
            // into_raw transfers ownership to the C side.
            *errmsg = cstr.into_raw();
        }
    }
}

/// Clear the ERRMSG pointer (must be called at FFI entry).
///
/// Resets `*errmsg` to NULL so a later non-NULL value unambiguously signals
/// an error raised by this call. A NULL `errmsg` is a silent no-op.
///
/// # Safety
/// `errmsg` must be a valid pointer to a `*mut c_char`.
pub unsafe fn clear_errmsg(errmsg: *mut *mut c_char) {
    if !errmsg.is_null() {
        *errmsg = std::ptr::null_mut();
    }
}

================================================ FILE: data/rust/morloc-runtime/src/eval_ffi.rs ================================================
//! Expression evaluator and constructor functions.
//! Replaces eval.c. Uses HashMap instead of linked-list dict_t.
use std::collections::HashMap; use std::ffi::{c_char, c_void, CStr}; use std::ptr; use crate::cschema::CSchema; use crate::error::{clear_errmsg, set_errmsg, MorlocError}; use crate::manifest_ffi::*; use crate::shm::{self, AbsPtr, RelPtr}; // ── Constructor functions (called by manifest_ffi.rs and daemon.c) ─────────── #[no_mangle] pub unsafe extern "C" fn make_morloc_bound_var( schema_str: *const c_char, varname: *mut c_char, errmsg: *mut *mut c_char, ) -> *mut MorlocExpression { clear_errmsg(errmsg); let mut err: *mut c_char = ptr::null_mut(); let schema = crate::ffi::parse_schema(schema_str, &mut err); if !err.is_null() { *errmsg = err; return ptr::null_mut(); } let expr = libc::calloc(1, std::mem::size_of::()) as *mut MorlocExpression; if expr.is_null() { set_errmsg(errmsg, &MorlocError::Other("Failed to allocate bound variable expression".into())); return ptr::null_mut(); } (*expr).etype = MorlocExpressionType::Bnd; (*expr).schema = schema; (*expr).expr.bnd_expr = varname; expr } #[no_mangle] pub unsafe extern "C" fn make_morloc_literal( schema_str: *const c_char, lit: Primitive, errmsg: *mut *mut c_char, ) -> *mut MorlocExpression { clear_errmsg(errmsg); let mut err: *mut c_char = ptr::null_mut(); let schema = crate::ffi::parse_schema(schema_str, &mut err); if !err.is_null() { *errmsg = err; return ptr::null_mut(); } let data = libc::malloc(std::mem::size_of::()) as *mut MorlocData; if data.is_null() { set_errmsg(errmsg, &MorlocError::Other("Failed to allocate literal data".into())); return ptr::null_mut(); } (*data).is_voidstar = false; (*data).data = DataUnion { lit_val: std::mem::ManuallyDrop::new(lit) }; let expr = libc::malloc(std::mem::size_of::()) as *mut MorlocExpression; if expr.is_null() { libc::free(data as *mut c_void); set_errmsg(errmsg, &MorlocError::Other("Failed to allocate literal expression".into())); return ptr::null_mut(); } (*expr).etype = MorlocExpressionType::Dat; (*expr).schema = schema; (*expr).expr.data_expr = data; expr } 
#[no_mangle] pub unsafe extern "C" fn make_morloc_pattern( schema_str: *const c_char, pattern: *mut MorlocPattern, errmsg: *mut *mut c_char, ) -> *mut MorlocExpression { clear_errmsg(errmsg); let mut err: *mut c_char = ptr::null_mut(); let schema = crate::ffi::parse_schema(schema_str, &mut err); if !err.is_null() { *errmsg = err; return ptr::null_mut(); } let expr = libc::calloc(1, std::mem::size_of::()) as *mut MorlocExpression; if expr.is_null() { set_errmsg(errmsg, &MorlocError::Other("Failed to allocate pattern expression".into())); return ptr::null_mut(); } (*expr).etype = MorlocExpressionType::Pat; (*expr).schema = schema; (*expr).expr.pattern_expr = pattern; expr } #[no_mangle] pub extern "C" fn make_morloc_pattern_end() -> *mut MorlocPattern { // SAFETY: calloc returns zeroed memory suitable for MorlocPattern. // We initialize all fields before returning. unsafe { let pat = libc::calloc(1, std::mem::size_of::()) as *mut MorlocPattern; if pat.is_null() { return ptr::null_mut(); } (*pat).ptype = MorlocPatternType::End; (*pat).size = 0; (*pat).fields = PatternFields { indices: ptr::null_mut() }; (*pat).selectors = ptr::null_mut(); pat } } // Varargs constructors (make_morloc_container, make_morloc_app, // make_morloc_lambda, make_morloc_interpolation, make_morloc_pattern_idx, // make_morloc_pattern_key) are only used by generated C++ pool code. // They cannot be implemented in stable Rust due to C-variadic ABI. // The C-gcc build path (morloc init) provides them from the original eval.c. // The Rust hybrid build does not call them (only morloc_eval and the // non-varargs constructors are needed). // ── Core evaluator ─────────────────────────────────────────────────────────── type BndVars<'a> = HashMap<&'a str, AbsPtr>; /// Convert key-based pattern selectors to index-based using the schema's key names. /// /// # Safety /// `pattern` and `schema` must be valid, non-null pointers to C-allocated structures. 
/// `schema` keys array must have `schema.size` entries.
unsafe fn convert_keys_to_indices(
    pattern: *mut MorlocPattern,
    schema: *const CSchema,
) -> Result<(), MorlocError> {
    let pat = &mut *pattern;
    let n_params = (*schema).size;
    // Recurse into child selectors first. Single-parameter schemas (and
    // primitives) have no nested structure to rewrite.
    //
    // NOTE(review): recursion pairs selector i with schema parameter i
    // *positionally*, before any ByKey→ByIndex resolution below has mapped
    // key i to its true parameter index. If a ByKey pattern's keys are not in
    // declaration order, the child recursion may use the wrong sub-schema —
    // confirm against the original eval.c behavior.
    if n_params > 1 {
        for i in 0..pat.size {
            let child_schema = *(*schema).parameters.add(i);
            convert_keys_to_indices(*pat.selectors.add(i), child_schema)?;
        }
    }
    if pat.ptype == MorlocPatternType::ByKey {
        // Build the replacement index array; each key name is resolved by a
        // linear scan of the schema's key table.
        // NOTE(review): calloc result is not checked for NULL before use.
        let indices = libc::calloc(n_params, std::mem::size_of::()) as *mut usize;
        for i in 0..pat.size {
            let key = CStr::from_ptr(*pat.fields.keys.add(i)).to_str().unwrap_or("");
            let mut found = false;
            for j in 0..n_params {
                let record_key = CStr::from_ptr(*(*schema).keys.add(j)).to_str().unwrap_or("");
                if key == record_key {
                    found = true;
                    *indices.add(i) = j;
                    break;
                }
            }
            if !found {
                // Unknown key: release the partial index array and fail.
                // (Keys freed in earlier iterations stay freed; the pattern
                // is left in a partially-consumed state on this error path.)
                libc::free(indices as *mut c_void);
                return Err(MorlocError::Other(format!("Pattern contains key missing in schema: {}", key)));
            }
            // Key string resolved — its C string is no longer needed.
            libc::free(*pat.fields.keys.add(i) as *mut c_void);
        }
        // Swap the union from the keys view to the indices view; the old
        // keys array itself must be freed before repointing.
        pat.ptype = MorlocPatternType::ByIndex;
        libc::free(pat.fields.keys as *mut c_void);
        pat.fields.indices = indices;
    }
    Ok(())
}

/// Extract fields from a voidstar value using a pattern, copying them into dest.
///
/// # Safety
/// All pointer arguments must be valid and point to correctly-typed C structures.
/// `value` must point to voidstar data matching `value_schema`.
unsafe fn apply_getter(
    dest: AbsPtr,
    return_index: &mut usize,
    return_schema: *const CSchema,
    pattern: *mut MorlocPattern,
    value_schema: *const CSchema,
    value: AbsPtr,
) -> Result {
    let pat = &*pattern;
    match pat.ptype {
        MorlocPatternType::ByIndex => {
            // Descend into each selected field: offset the source pointer by
            // the field's offset and narrow the schema to the field's type.
            // `dest`/`return_schema` stay fixed; `return_index` tracks which
            // output slot the next End leaf fills.
            for i in 0..pat.size {
                let idx = *pat.fields.indices.add(i);
                apply_getter(
                    dest,
                    return_index,
                    return_schema,
                    *pat.selectors.add(i),
                    *(*value_schema).parameters.add(idx),
                    value.add(*(*value_schema).offsets.add(idx)),
                )?;
            }
        }
        MorlocPatternType::ByKey => {
            // Resolve key names to indices in place, then retry as ByIndex.
            convert_keys_to_indices(pattern, value_schema)?;
            return apply_getter(dest, return_index, return_schema, pattern, value_schema, value);
        }
        MorlocPatternType::End => {
            // Leaf: copy the current value into the next output slot. For a
            // multi-field return schema, slot i lives at offsets[i] with that
            // parameter's width; a scalar return uses dest directly.
            let (element_dest, element_width) = if (*return_schema).size > 1 {
                (dest.add(*(*return_schema).offsets.add(*return_index)), (*(*(*return_schema).parameters.add(*return_index))).width)
            } else {
                (dest, (*return_schema).width)
            };
            *return_index += 1;
            ptr::copy_nonoverlapping(value, element_dest, element_width);
        }
    }
    Ok(dest)
}

/// Copy value into dest, preserving fields not selected by pattern.
///
/// # Safety
/// All pointer arguments must be valid. Schema sizes must match.
unsafe fn apply_setter_copy(
    dest: AbsPtr,
    return_schema: *const CSchema,
    pattern: *mut MorlocPattern,
    value_schema: *const CSchema,
    value: AbsPtr,
) -> Result<(), MorlocError> {
    let pat = &*pattern;
    match pat.ptype {
        MorlocPatternType::ByKey => {
            // Resolve key names to indices in place, then retry as ByIndex.
            convert_keys_to_indices(pattern, value_schema)?;
            return apply_setter_copy(dest, return_schema, pattern, value_schema, value);
        }
        MorlocPatternType::ByIndex => {
            // Setter copy step: walk every field of the value. Fields the
            // pattern selects are recursed into (their leaves are left for
            // apply_setter_set to overwrite); unselected fields are copied
            // verbatim so the result preserves them.
            if (*value_schema).size != (*return_schema).size {
                return Err(MorlocError::Other("Expected setter return and input sizes to be the same".into()));
            }
            for i in 0..(*value_schema).size {
                let new_dest = dest.add(*(*return_schema).offsets.add(i));
                let new_value = value.add(*(*value_schema).offsets.add(i));
                let mut changed = false;
                // Linear scan: is field i selected by any pattern entry?
                for j in 0..pat.size {
                    if i == *pat.fields.indices.add(j) {
                        apply_setter_copy(
                            new_dest,
                            *(*return_schema).parameters.add(i),
                            *pat.selectors.add(j),
                            *(*value_schema).parameters.add(i),
                            new_value,
                        )?;
                        changed = true;
                        break;
                    }
                }
                if !changed {
                    // Untouched field: shallow byte copy at its full width.
                    let w = (*(*(*value_schema).parameters.add(i))).width;
                    ptr::copy_nonoverlapping(new_value, new_dest, w);
                }
            }
        }
        // End leaves are intentionally skipped here — apply_setter_set fills
        // them with the replacement values.
        MorlocPatternType::End => {}
    }
    Ok(())
}

/// Overwrite pattern-selected fields in dest with provided set_values.
///
/// # Safety
/// All pointer arguments must be valid. set_values must have enough entries.
unsafe fn apply_setter_set( dest: AbsPtr, return_schema: *const CSchema, pattern: *mut MorlocPattern, value_schema: *const CSchema, value: AbsPtr, set_schemas: *mut *mut CSchema, set_values: *mut AbsPtr, set_idx: &mut usize, ) -> Result<(), MorlocError> { let pat = &*pattern; match pat.ptype { MorlocPatternType::ByIndex => { for pi in 0..pat.size { let di = *pat.fields.indices.add(pi); apply_setter_set( dest.add(*(*return_schema).offsets.add(di)), *(*return_schema).parameters.add(di), *pat.selectors.add(pi), *(*value_schema).parameters.add(di), value.add(*(*value_schema).offsets.add(di)), set_schemas, set_values, set_idx, )?; } } MorlocPatternType::End => { ptr::copy_nonoverlapping(*set_values.add(*set_idx), dest, (*return_schema).width); *set_idx += 1; } MorlocPatternType::ByKey => { return Err(MorlocError::Other("Key patterns should have been resolved in copy step".into())); } } Ok(()) } /// Recursively evaluate a morloc expression, writing results into SHM. /// /// # Safety /// `expr` must be a valid MorlocExpression pointer (or null for error). /// If `dest` is non-null, it must point to `width` bytes of writable SHM. 
unsafe fn morloc_eval_r( expr: *mut MorlocExpression, dest: AbsPtr, width: usize, bndvars: &mut BndVars, ) -> Result { if expr.is_null() { return Err(MorlocError::Other("Empty expression".into())); } let schema = (*expr).schema; let (dest, width) = if dest.is_null() { let w = (*schema).width; let d = shm::shcalloc(1, w)?; (d, w) } else { if width != (*schema).width { return Err(MorlocError::Other("Unexpected data size".into())); } (dest, width) }; match (*expr).etype { MorlocExpressionType::Dat => { let data = (*expr).expr.data_expr; if (*data).is_voidstar { return Ok((*data).data.voidstar as AbsPtr); } let stype = (*schema).serial_type; if stype == crate::schema::SerialType::String as u32 { // String: allocate in SHM let s = std::mem::ManuallyDrop::into_inner(ptr::read(&(*data).data.lit_val)).s; let str_size = if s.is_null() { 0 } else { libc::strlen(s) }; let str_relptr: RelPtr = if str_size > 0 { let abs = shm::shmemcpy(s as *const u8, str_size)?; shm::abs2rel(abs)? } else { -1isize as RelPtr }; let arr = shm::Array { size: str_size, data: str_relptr }; ptr::copy_nonoverlapping(&arr as *const shm::Array as *const u8, dest, width); } else if stype == crate::schema::SerialType::Array as u32 { let arr_data = (*data).data.array_val; let arr_size = (*arr_data).size; let elem_schema = (*arr_data).schema; let elem_width = (*elem_schema).width; let arr_reldata: RelPtr = if arr_size > 0 { let arr_abs = shm::shcalloc(arr_size, elem_width)?; for i in 0..arr_size { morloc_eval_r( *(*arr_data).values.add(i), arr_abs.add(i * elem_width), elem_width, bndvars, )?; } shm::abs2rel(arr_abs)? 
} else { -1isize as RelPtr }; let arr = shm::Array { size: arr_size, data: arr_reldata }; ptr::copy_nonoverlapping(&arr as *const shm::Array as *const u8, dest, width); } else if stype == crate::schema::SerialType::Tuple as u32 || stype == crate::schema::SerialType::Map as u32 { for i in 0..(*schema).size { let elem_width = (*(*(*schema).parameters.add(i))).width; let elem_dest = dest.add(*(*schema).offsets.add(i)); let element = *(*data).data.tuple_val.add(i); morloc_eval_r(element, elem_dest, elem_width, bndvars)?; } } else { // All primitives: just copy width bytes from the union ptr::copy_nonoverlapping( &(*data).data as *const DataUnion as *const u8, dest, width, ); } } MorlocExpressionType::App => { let app = (*expr).expr.app_expr; let nargs = (*app).nargs; // Evaluate all arguments let mut arg_results: Vec = Vec::with_capacity(nargs); for i in 0..nargs { let r = morloc_eval_r(*(*app).args.add(i), ptr::null_mut(), 0, bndvars)?; arg_results.push(r); } match (*app).atype { MorlocAppExpressionType::Pattern => { if nargs == 1 { let mut return_index: usize = 0; apply_getter( dest, &mut return_index, schema, (*app).function.pattern, (*(*(*app).args)).schema, arg_results[0], )?; } else if nargs > 1 { // Setter: first arg is the value, rest are set values let mut set_schemas: Vec<*mut CSchema> = Vec::with_capacity(nargs - 1); for i in 1..nargs { set_schemas.push((*(*(*app).args.add(i))).schema); } apply_setter_copy( dest, schema, (*app).function.pattern, (*(*(*app).args)).schema, arg_results[0], )?; let mut set_idx: usize = 0; apply_setter_set( dest, schema, (*app).function.pattern, (*(*(*app).args)).schema, arg_results[0], set_schemas.as_mut_ptr(), arg_results[1..].as_ptr() as *mut AbsPtr, &mut set_idx, )?; } else { return Err(MorlocError::Other("No arguments provided to pattern".into())); } } MorlocAppExpressionType::Lambda => { let lam = (*app).function.lambda; // Bind arguments for i in 0..nargs { let var = 
CStr::from_ptr(*(*lam).args.add(i)).to_str().unwrap_or(""); bndvars.insert(var, arg_results[i]); } morloc_eval_r((*lam).body, dest, width, bndvars)?; // Clean up bindings for i in 0..nargs { let var = CStr::from_ptr(*(*lam).args.add(i)).to_str().unwrap_or(""); bndvars.remove(var); } } MorlocAppExpressionType::Format => { let strings = (*app).function.fmt; let mut result_size: usize = 0; let mut string_lengths: Vec = Vec::with_capacity(nargs + 1); for i in 0..=nargs { let len = libc::strlen(*strings.add(i)); string_lengths.push(len); result_size += len; } for i in 0..nargs { let arr = &*(arg_results[i] as *const shm::Array); result_size += arr.size; } let new_string = shm::shmalloc(result_size)?; let result_array = &mut *(dest as *mut shm::Array); result_array.size = result_size; result_array.data = shm::abs2rel(new_string)?; let mut cursor = new_string; for i in 0..=nargs { ptr::copy_nonoverlapping(*strings.add(i) as *const u8, cursor, string_lengths[i]); cursor = cursor.add(string_lengths[i]); if i < nargs { let arr = &*(arg_results[i] as *const shm::Array); if arr.size > 0 { let arr_data = shm::rel2abs(arr.data)?; ptr::copy_nonoverlapping(arr_data, cursor, arr.size); cursor = cursor.add(arr.size); } } } } } } MorlocExpressionType::Bnd => { let varname = CStr::from_ptr((*expr).expr.bnd_expr).to_str().unwrap_or(""); let bnd_value = bndvars.get(varname).copied() .ok_or_else(|| MorlocError::Other(format!("Unbound variable {}", varname)))?; ptr::copy_nonoverlapping(bnd_value, dest, (*schema).width); } MorlocExpressionType::Show => { // Serialize child to JSON string let child = (*expr).expr.unary_expr; let child_schema = (*child).schema; let child_result = morloc_eval_r(child, ptr::null_mut(), 0, bndvars)?; extern "C" { fn voidstar_to_json_string(data: *const c_void, schema: *const CSchema, errmsg: *mut *mut c_char) -> *mut c_char; } let mut err: *mut c_char = ptr::null_mut(); let json = voidstar_to_json_string(child_result as *const c_void, child_schema, &mut err); 
if !err.is_null() { let msg = CStr::from_ptr(err).to_string_lossy().into_owned(); libc::free(err as *mut c_void); return Err(MorlocError::Other(msg)); } let json_len = libc::strlen(json); let str_relptr: RelPtr = if json_len > 0 { let abs = shm::shmemcpy(json as *const u8, json_len)?; libc::free(json as *mut c_void); shm::abs2rel(abs)? } else { libc::free(json as *mut c_void); -1isize as RelPtr }; let arr = shm::Array { size: json_len, data: str_relptr }; ptr::copy_nonoverlapping(&arr as *const shm::Array as *const u8, dest, width); } MorlocExpressionType::Read => { // Deserialize JSON string to typed data, return optional let child = (*expr).expr.unary_expr; let child_result = morloc_eval_r(child, ptr::null_mut(), 0, bndvars)?; let str_arr = &*(child_result as *const shm::Array); let opt_dest = dest; let inner_schema = *(*schema).parameters; if str_arr.size > 0 { let str_abs = shm::rel2abs(str_arr.data)?; let json_str = libc::malloc(str_arr.size + 1) as *mut c_char; if json_str.is_null() { return Err(MorlocError::Other("Failed to allocate for @read".into())); } ptr::copy_nonoverlapping(str_abs, json_str as *mut u8, str_arr.size); *json_str.add(str_arr.size) = 0; extern "C" { fn read_json_with_schema(dest: *mut u8, json: *mut c_char, schema: *const CSchema, errmsg: *mut *mut c_char) -> *mut u8; } let inner_offset = *(*schema).offsets; let mut parse_err: *mut c_char = ptr::null_mut(); let parsed = read_json_with_schema(opt_dest.add(inner_offset), json_str, inner_schema, &mut parse_err); libc::free(json_str as *mut c_void); if !parse_err.is_null() { libc::free(parse_err as *mut c_void); *opt_dest = 0; // None } else { *opt_dest = if parsed.is_null() { 0 } else { 1 }; } } else { *opt_dest = 0; // None } } MorlocExpressionType::Hash => { // Hash child data and return hex string let child = (*expr).expr.unary_expr; let child_schema = (*child).schema; let child_result = morloc_eval_r(child, ptr::null_mut(), 0, bndvars)?; extern "C" { fn mlc_hash(data: *const c_void, 
schema: *const CSchema, errmsg: *mut *mut c_char) -> *mut c_char; } let mut err: *mut c_char = ptr::null_mut(); let hex = mlc_hash(child_result as *const c_void, child_schema, &mut err); if !err.is_null() { let msg = CStr::from_ptr(err).to_string_lossy().into_owned(); libc::free(err as *mut c_void); return Err(MorlocError::Other(msg)); } let hex_len = libc::strlen(hex); let str_relptr: RelPtr = if hex_len > 0 { let abs = shm::shmemcpy(hex as *const u8, hex_len)?; libc::free(hex as *mut c_void); shm::abs2rel(abs)? } else { libc::free(hex as *mut c_void); -1isize as RelPtr }; let arr = shm::Array { size: hex_len, data: str_relptr }; ptr::copy_nonoverlapping(&arr as *const shm::Array as *const u8, dest, width); } MorlocExpressionType::Save => { // Save value to file at path let save = (*expr).expr.save_expr; let value_expr = (*save).value; let path_expr = (*save).path; let fmt = CStr::from_ptr((*save).format).to_str().unwrap_or("voidstar"); let value_schema = (*value_expr).schema; let value_result = morloc_eval_r(value_expr, ptr::null_mut(), 0, bndvars)?; let path_result = morloc_eval_r(path_expr, ptr::null_mut(), 0, bndvars)?; // Extract path string from voidstar Array let path_arr = &*(path_result as *const shm::Array); let path_abs = shm::rel2abs(path_arr.data)?; let path_cstr = libc::malloc(path_arr.size + 1) as *mut c_char; if path_cstr.is_null() { return Err(MorlocError::Other("Failed to allocate for @save path".into())); } ptr::copy_nonoverlapping(path_abs, path_cstr as *mut u8, path_arr.size); *path_cstr.add(path_arr.size) = 0; extern "C" { fn mlc_save(data: *const c_void, schema: *const CSchema, path: *const c_char, errmsg: *mut *mut c_char) -> i32; fn mlc_save_json(data: *const c_void, schema: *const CSchema, path: *const c_char, errmsg: *mut *mut c_char) -> i32; fn mlc_save_voidstar(data: *const c_void, schema: *const CSchema, path: *const c_char, errmsg: *mut *mut c_char) -> i32; } let mut err: *mut c_char = ptr::null_mut(); let rc = match fmt { "json" => 
mlc_save_json(value_result as *const c_void, value_schema, path_cstr, &mut err), "msgpack" => mlc_save(value_result as *const c_void, value_schema, path_cstr, &mut err), _ => mlc_save_voidstar(value_result as *const c_void, value_schema, path_cstr, &mut err), }; libc::free(path_cstr as *mut c_void); if rc != 0 && !err.is_null() { let msg = CStr::from_ptr(err).to_string_lossy().into_owned(); libc::free(err as *mut c_void); return Err(MorlocError::Other(msg)); } // Return unit (zero-fill dest) ptr::write_bytes(dest, 0, width); } MorlocExpressionType::Load => { // Load data from file, return optional let child = (*expr).expr.unary_expr; let child_result = morloc_eval_r(child, ptr::null_mut(), 0, bndvars)?; // Extract path string from voidstar Array let path_arr = &*(child_result as *const shm::Array); let path_abs = shm::rel2abs(path_arr.data)?; let path_cstr = libc::malloc(path_arr.size + 1) as *mut c_char; if path_cstr.is_null() { return Err(MorlocError::Other("Failed to allocate for @load path".into())); } ptr::copy_nonoverlapping(path_abs, path_cstr as *mut u8, path_arr.size); *path_cstr.add(path_arr.size) = 0; extern "C" { fn mlc_load(path: *const c_char, schema: *const CSchema, errmsg: *mut *mut c_char) -> *mut c_void; } let opt_dest = dest; let inner_schema = *(*schema).parameters; let inner_offset = *(*schema).offsets; let mut err: *mut c_char = ptr::null_mut(); let loaded = mlc_load(path_cstr, inner_schema, &mut err); libc::free(path_cstr as *mut c_void); if loaded.is_null() { if !err.is_null() { libc::free(err as *mut c_void); } *opt_dest = 0; // None } else { // Copy loaded voidstar data into the optional's inner slot let inner_width = (*inner_schema).width; ptr::copy_nonoverlapping(loaded as *const u8, opt_dest.add(inner_offset), inner_width); libc::free(loaded as *mut c_void); *opt_dest = 1; // Some } } _ => { return Err(MorlocError::Other("Illegal top expression".into())); } } Ok(dest) } // ── Public entry point 
────���─────────────────────────────────��──────────────── #[no_mangle] pub unsafe extern "C" fn morloc_eval( expr: *mut MorlocExpression, return_schema: *mut CSchema, arg_voidstar: *mut *mut u8, arg_schemas: *mut *mut CSchema, nargs: usize, errmsg: *mut *mut c_char, ) -> AbsPtr { clear_errmsg(errmsg); let mut bndvars: BndVars = HashMap::new(); let new_expr: *mut MorlocExpression; let mut allocated_wrappers: Vec<*mut c_void> = Vec::new(); let eval_expr = match (*expr).etype { MorlocExpressionType::Lam | MorlocExpressionType::Pat => { // Wrap CLI args as voidstar data expressions and apply let arg_exprs = libc::calloc(nargs, std::mem::size_of::<*mut MorlocExpression>()) as *mut *mut MorlocExpression; allocated_wrappers.push(arg_exprs as *mut c_void); for i in 0..nargs { let ae = libc::calloc(1, std::mem::size_of::()) as *mut MorlocExpression; (*ae).etype = MorlocExpressionType::Dat; (*ae).schema = *arg_schemas.add(i); let ad = libc::calloc(1, std::mem::size_of::()) as *mut MorlocData; (*ad).is_voidstar = true; (*ad).data.voidstar = *arg_voidstar.add(i) as *mut c_void; (*ae).expr.data_expr = ad; *arg_exprs.add(i) = ae; allocated_wrappers.push(ad as *mut c_void); allocated_wrappers.push(ae as *mut c_void); } let app = libc::calloc(1, std::mem::size_of::()) as *mut MorlocAppExpression; (*app).atype = if (*expr).etype == MorlocExpressionType::Lam { (*app).function.lambda = (*expr).expr.lam_expr; MorlocAppExpressionType::Lambda } else { (*app).function.pattern = (*expr).expr.pattern_expr; MorlocAppExpressionType::Pattern }; (*app).args = arg_exprs; (*app).nargs = nargs; allocated_wrappers.push(app as *mut c_void); new_expr = libc::calloc(1, std::mem::size_of::()) as *mut MorlocExpression; (*new_expr).etype = MorlocExpressionType::App; (*new_expr).schema = return_schema; (*new_expr).expr.app_expr = app; allocated_wrappers.push(new_expr as *mut c_void); new_expr } _ => expr, }; let result = morloc_eval_r(eval_expr, ptr::null_mut(), 0, &mut bndvars); // Free wrapper nodes 
for p in &allocated_wrappers { libc::free(*p); } match result { Ok(ptr) => ptr, Err(e) => { set_errmsg(errmsg, &e); ptr::null_mut() } } } ================================================ FILE: data/rust/morloc-runtime/src/ffi.rs ================================================ //! C ABI wrappers for libmorloc.so //! //! These `extern "C"` functions match the signatures in morloc.h. //! Internally they call the Rust implementations and convert between //! Rust Result and the C ERRMSG convention (char** last arg). use std::ffi::{c_char, c_void, CStr, CString}; use std::ptr; use crate::error::{clear_errmsg, set_errmsg, MorlocError}; use crate::schema::{self}; use crate::shm::{self, AbsPtr, BlockHeader, RelPtr, ShmHeader, VolPtr}; pub use crate::cschema::CSchema; // ── Macro for ERRMSG-pattern FFI wrappers ────────────────────────────────── /// Wrap a Rust Result-returning expression into the C ERRMSG convention. /// On success: clears errmsg, returns the value. /// On error: sets errmsg, returns $fail. macro_rules! ffi_try { ($errmsg:expr, $fail:expr, $body:expr) => {{ unsafe { clear_errmsg($errmsg) }; match $body { Ok(val) => val, Err(e) => { unsafe { set_errmsg($errmsg, &e) }; $fail } } }}; } // CSchema type and conversions are in cschema.rs (always compiled). 
// ── SHM functions ────────────────────────────────────────────────────────── #[no_mangle] pub unsafe extern "C" fn shinit( shm_basename: *const c_char, volume_index: usize, shm_size: usize, errmsg: *mut *mut c_char, ) -> *mut ShmHeader { let basename = CStr::from_ptr(shm_basename).to_string_lossy(); ffi_try!(errmsg, ptr::null_mut(), shm::shinit(&basename, volume_index, shm_size)) } #[no_mangle] pub unsafe extern "C" fn shopen( volume_index: usize, errmsg: *mut *mut c_char, ) -> *mut ShmHeader { ffi_try!( errmsg, ptr::null_mut(), shm::shopen(volume_index).and_then(|opt| opt.ok_or(MorlocError::Shm("volume not found".into()))) ) } #[no_mangle] pub unsafe extern "C" fn shclose(errmsg: *mut *mut c_char) -> bool { ffi_try!(errmsg, false, shm::shclose().map(|_| true)) } #[no_mangle] pub unsafe extern "C" fn shm_set_fallback_dir(dir: *const c_char) { if !dir.is_null() { let d = CStr::from_ptr(dir).to_string_lossy(); shm::shm_set_fallback_dir(&d); } } #[no_mangle] pub unsafe extern "C" fn shmalloc(size: usize, errmsg: *mut *mut c_char) -> *mut c_void { ffi_try!(errmsg, ptr::null_mut(), shm::shmalloc(size).map(|p| p as *mut c_void)) } #[no_mangle] pub unsafe extern "C" fn shmemcpy( src: *mut c_void, size: usize, errmsg: *mut *mut c_char, ) -> *mut c_void { ffi_try!( errmsg, ptr::null_mut(), shm::shmemcpy(src as *const u8, size).map(|p| p as *mut c_void) ) } #[no_mangle] pub unsafe extern "C" fn shcalloc( nmemb: usize, size: usize, errmsg: *mut *mut c_char, ) -> *mut c_void { ffi_try!(errmsg, ptr::null_mut(), shm::shcalloc(nmemb, size).map(|p| p as *mut c_void)) } #[no_mangle] pub unsafe extern "C" fn shrealloc( ptr: *mut c_void, size: usize, errmsg: *mut *mut c_char, ) -> *mut c_void { // TODO: implement shrealloc in shm.rs let _ = (ptr, size); set_errmsg(errmsg, &MorlocError::Shm("shrealloc not yet implemented".into())); ptr::null_mut() } #[no_mangle] pub unsafe extern "C" fn shfree(ptr: *mut c_void, errmsg: *mut *mut c_char) -> bool { ffi_try!(errmsg, false, 
shm::shfree(ptr as AbsPtr).map(|_| true)) } #[no_mangle] pub unsafe extern "C" fn shincref(ptr: *mut c_void, errmsg: *mut *mut c_char) -> bool { ffi_try!(errmsg, false, shm::shincref(ptr as AbsPtr).map(|_| true)) } // shfree_by_schema is provided by cli.c #[no_mangle] pub unsafe extern "C" fn total_shm_size() -> usize { shm::total_shm_size() } #[no_mangle] pub unsafe extern "C" fn rel2abs(ptr: RelPtr, errmsg: *mut *mut c_char) -> *mut c_void { ffi_try!(errmsg, ptr::null_mut(), shm::rel2abs(ptr).map(|p| p as *mut c_void)) } #[no_mangle] pub unsafe extern "C" fn abs2rel(ptr: *mut c_void, errmsg: *mut *mut c_char) -> RelPtr { ffi_try!(errmsg, shm::RELNULL, shm::abs2rel(ptr as AbsPtr)) } #[no_mangle] pub unsafe extern "C" fn abs2shm(ptr: *mut c_void, errmsg: *mut *mut c_char) -> *mut ShmHeader { ffi_try!(errmsg, ptr::null_mut(), shm::abs2shm(ptr as AbsPtr)) } #[no_mangle] pub unsafe extern "C" fn abs2blk(ptr: *mut c_void, errmsg: *mut *mut c_char) -> *mut BlockHeader { clear_errmsg(errmsg); if ptr.is_null() { set_errmsg(errmsg, &MorlocError::NullPointer); return ptr::null_mut(); } let blk = (ptr as *mut u8).sub(std::mem::size_of::()) as *mut BlockHeader; if (*blk).magic != shm::BLK_MAGIC { set_errmsg(errmsg, &MorlocError::Shm("Bad block magic".into())); return ptr::null_mut(); } blk } #[no_mangle] pub unsafe extern "C" fn vol2rel(ptr: VolPtr, shm_ptr: *const ShmHeader) -> RelPtr { shm::vol2rel(ptr, &*shm_ptr) } #[no_mangle] pub unsafe extern "C" fn vol2abs(ptr: VolPtr, shm_ptr: *const ShmHeader) -> *mut c_void { shm::vol2abs(ptr, shm_ptr) as *mut c_void } // ── Schema functions ─────────────────────────────────────────────────────── #[no_mangle] pub unsafe extern "C" fn parse_schema( schema_str: *const c_char, errmsg: *mut *mut c_char, ) -> *mut CSchema { clear_errmsg(errmsg); if schema_str.is_null() { set_errmsg(errmsg, &MorlocError::NullPointer); return ptr::null_mut(); } let s = CStr::from_ptr(schema_str).to_string_lossy(); match schema::parse_schema(&s) { 
Ok(schema) => CSchema::from_rust(&schema), Err(e) => { set_errmsg(errmsg, &e); ptr::null_mut() } } } #[no_mangle] pub unsafe extern "C" fn schema_to_string(schema: *const CSchema) -> *mut c_char { if schema.is_null() { return ptr::null_mut(); } let rs = CSchema::to_rust(schema); let s = schema::schema_to_string(&rs); match CString::new(s) { Ok(cs) => cs.into_raw(), Err(_) => ptr::null_mut(), } } #[no_mangle] pub unsafe extern "C" fn free_schema(schema: *mut CSchema) { CSchema::free(schema); } #[no_mangle] pub unsafe extern "C" fn schema_is_fixed_width(schema: *const CSchema) -> bool { if schema.is_null() { return true; } let rs = CSchema::to_rust(schema); rs.is_fixed_width() } #[no_mangle] pub unsafe extern "C" fn schema_alignment(schema: *const CSchema) -> usize { if schema.is_null() { return 1; } let rs = CSchema::to_rust(schema); rs.alignment() } // Hash: morloc_xxh64 is provided by utility.c (via xxhash.h inline) // ── Serialization ────────────────────────────────────────────────────────── #[no_mangle] pub unsafe extern "C" fn pack_with_schema( mlc: *const c_void, schema: *const CSchema, mpkptr: *mut *mut c_char, mpk_size: *mut usize, errmsg: *mut *mut c_char, ) -> i32 { clear_errmsg(errmsg); *mpkptr = ptr::null_mut(); *mpk_size = 0; let rs = CSchema::to_rust(schema); match crate::mpack::pack_with_schema(mlc as AbsPtr, &rs) { Ok(data) => { *mpk_size = data.len(); let buf = libc::malloc(data.len()) as *mut u8; if buf.is_null() { set_errmsg(errmsg, &MorlocError::Shm("malloc failed".into())); return 1; } std::ptr::copy_nonoverlapping(data.as_ptr(), buf, data.len()); *mpkptr = buf as *mut c_char; 0 } Err(e) => { set_errmsg(errmsg, &e); 1 } } } #[no_mangle] pub unsafe extern "C" fn pack( mlc: *const c_void, schema_str: *const c_char, mpkptr: *mut *mut c_char, mpk_size: *mut usize, errmsg: *mut *mut c_char, ) -> i32 { clear_errmsg(errmsg); let s = CStr::from_ptr(schema_str).to_string_lossy(); let schema = match schema::parse_schema(&s) { Ok(s) => s, Err(e) => { 
set_errmsg(errmsg, &e); return 1; } }; let cs = CSchema::from_rust(&schema); let result = pack_with_schema(mlc, cs, mpkptr, mpk_size, errmsg); free_schema(cs); result } #[no_mangle] pub unsafe extern "C" fn unpack_with_schema( mpk: *const c_char, mpk_size: usize, schema: *const CSchema, mlcptr: *mut *mut c_void, errmsg: *mut *mut c_char, ) -> i32 { clear_errmsg(errmsg); *mlcptr = ptr::null_mut(); let data = std::slice::from_raw_parts(mpk as *const u8, mpk_size); let rs = CSchema::to_rust(schema); match crate::mpack::unpack_with_schema(data, &rs) { Ok(ptr) => { *mlcptr = ptr as *mut c_void; 0 } Err(e) => { set_errmsg(errmsg, &e); 1 } } } // quoted, print_voidstar, pretty_print_voidstar, read_json_with_schema // are provided by json.c // ── Schema utility functions needed by C code ────────────────────────────── #[no_mangle] pub unsafe extern "C" fn calculate_voidstar_size( data: *const c_void, schema: *const CSchema, errmsg: *mut *mut c_char, ) -> usize { clear_errmsg(errmsg); if data.is_null() || schema.is_null() { return 0; } let rs = CSchema::to_rust(schema); match calc_voidstar_size_inner(data as *const u8, &rs) { Ok(size) => size, Err(e) => { set_errmsg(errmsg, &e); 0 } } } pub fn calc_voidstar_size_inner( data: *const u8, schema: &crate::schema::Schema, ) -> Result { use crate::schema::SerialType; use crate::shm::{self, Array, Tensor}; // SAFETY: data points to voidstar data in SHM with layout described by schema. // We only read Array/Tensor headers and follow relptrs to compute total size. 
unsafe { match schema.serial_type { SerialType::String => { let arr = &*(data as *const Array); Ok(std::mem::size_of::() + arr.size) } SerialType::Array => { let arr = &*(data as *const Array); let mut size = std::mem::size_of::(); if arr.size == 0 { return Ok(size); } let elem_schema = &schema.parameters[0]; let elem_width = elem_schema.width; size += elem_schema.alignment().saturating_sub(1); if schema.is_fixed_width() { size += elem_width * arr.size; } else { let elem_data = shm::rel2abs(arr.data)?; for i in 0..arr.size { size += calc_voidstar_size_inner( elem_data.add(i * elem_width), elem_schema, )?; } } Ok(size) } SerialType::Optional => { let tag = *data; let mut size = schema.width; if tag != 0 { let inner_offset = schema.offsets.first().copied().unwrap_or( shm::align_up(1, schema.parameters[0].alignment().max(1)), ); let inner_total = calc_voidstar_size_inner( data.add(inner_offset), &schema.parameters[0], )?; if inner_total > schema.parameters[0].width { size += inner_total - schema.parameters[0].width; } } Ok(size) } SerialType::Tensor => { let tensor = &*(data as *const Tensor); let ndim = schema.offsets.first().copied().unwrap_or(0); let elem_width = schema.parameters[0].width; let mut size = std::mem::size_of::(); size += schema.parameters[0].alignment().saturating_sub(1); size += ndim * std::mem::size_of::(); size += schema.parameters[0].alignment().saturating_sub(1); size += tensor.total_elements * elem_width; Ok(size) } SerialType::Tuple | SerialType::Map => { if schema.is_fixed_width() { Ok(schema.width) } else { let mut size = schema.width; for i in 0..schema.parameters.len() { let elem_total = calc_voidstar_size_inner( data.add(schema.offsets[i]), &schema.parameters[i], )?; if elem_total > schema.parameters[i].width { size += elem_total - schema.parameters[i].width; } } Ok(size) } } _ => Ok(schema.width), } } } #[no_mangle] pub unsafe extern "C" fn get_ptr( schema: *const CSchema, errmsg: *mut *mut c_char, ) -> *mut c_void { 
clear_errmsg(errmsg); if schema.is_null() { return ptr::null_mut(); } let rs = CSchema::to_rust(schema); ffi_try!(errmsg, ptr::null_mut(), shm::shmalloc(rs.width).map(|p| p as *mut c_void)) } ================================================ FILE: data/rust/morloc-runtime/src/hash.rs ================================================ //! xxHash64 wrapper using the twox-hash crate. //! Replaces the 1500-line xxhash.h header. use std::hash::Hasher; use twox_hash::XxHash64; const DEFAULT_SEED: u64 = 0; /// Compute xxHash64 of a byte slice with the default seed. pub fn xxh64(data: &[u8]) -> u64 { let mut hasher = XxHash64::with_seed(DEFAULT_SEED); hasher.write(data); hasher.finish() } /// Compute xxHash64 with a custom seed. pub fn xxh64_with_seed(data: &[u8], seed: u64) -> u64 { let mut hasher = XxHash64::with_seed(seed); hasher.write(data); hasher.finish() } /// Mix multiple hash values together (for composite keys). pub fn mix(a: u64, b: u64) -> u64 { // Use xxHash to mix two 64-bit values let mut hasher = XxHash64::with_seed(a); hasher.write(&b.to_le_bytes()); hasher.finish() } #[cfg(test)] mod tests { use super::*; #[test] fn test_xxh64_empty() { let h = xxh64(b""); assert_ne!(h, 0); // xxHash of empty with seed 0 is a known non-zero value } #[test] fn test_xxh64_deterministic() { let a = xxh64(b"hello"); let b = xxh64(b"hello"); assert_eq!(a, b); } #[test] fn test_xxh64_different_inputs() { let a = xxh64(b"hello"); let b = xxh64(b"world"); assert_ne!(a, b); } #[test] fn test_mix_commutative_ish() { // mix is not commutative by design let ab = mix(1, 2); let ba = mix(2, 1); assert_ne!(ab, ba); } } ================================================ FILE: data/rust/morloc-runtime/src/http_ffi.rs ================================================ //! C ABI wrappers for HTTP request/response handling. //! Replaces http.c. 
use std::ffi::{c_char, c_void}; use std::ptr; use crate::error::{clear_errmsg, set_errmsg, MorlocError}; const HTTP_MAX_HEADERS: usize = 8192; const HTTP_MAX_REQUEST: usize = 4 * 1024 * 1024; // ── C-compatible types ─────────────────────────────────────────────────────── #[repr(C)] #[derive(Debug, Clone, Copy, PartialEq)] pub enum HttpMethod { Get = 0, Post = 1, Delete = 2, Options = 3, } #[repr(C)] pub struct HttpRequest { pub method: HttpMethod, pub path: [c_char; 256], pub body: *mut c_char, pub body_len: usize, } #[repr(C)] #[derive(Debug, Clone, Copy, PartialEq)] pub enum DaemonMethod { Call = 0, Discover = 1, Health = 2, Eval = 3, Typecheck = 4, Bind = 5, Bindings = 6, Unbind = 7, } #[repr(C)] pub struct DaemonRequest { pub id: *mut c_char, pub method: DaemonMethod, pub command: *mut c_char, pub args_json: *mut c_char, pub expr: *mut c_char, pub name: *mut c_char, } // ── http_parse_request ─────────────────────────────────────────────────────── #[no_mangle] pub unsafe extern "C" fn http_parse_request( fd: i32, errmsg: *mut *mut c_char, ) -> *mut HttpRequest { clear_errmsg(errmsg); // Read headers byte by byte until \r\n\r\n let mut header_buf = vec![0u8; HTTP_MAX_HEADERS]; let mut header_len: usize = 0; let mut header_end_pos: Option = None; while header_len < HTTP_MAX_HEADERS - 1 { let n = libc::recv(fd, header_buf.as_mut_ptr().add(header_len) as *mut c_void, 1, 0); if n <= 0 { set_errmsg(errmsg, &MorlocError::Other("Connection closed while reading HTTP headers".into())); return ptr::null_mut(); } header_len += 1; if header_len >= 4 { let tail = &header_buf[header_len - 4..header_len]; if tail == b"\r\n\r\n" { header_end_pos = Some(header_len - 4); break; } } } let header_end = match header_end_pos { Some(p) => p, None => { set_errmsg(errmsg, &MorlocError::Other("HTTP headers too large or malformed".into())); return ptr::null_mut(); } }; let header_str = std::str::from_utf8(&header_buf[..header_len]).unwrap_or(""); // Allocate request let req = 
libc::calloc(1, std::mem::size_of::()) as *mut HttpRequest; if req.is_null() { set_errmsg(errmsg, &MorlocError::Other("Failed to allocate http_request_t".into())); return ptr::null_mut(); } // Parse method if header_str.starts_with("GET ") { (*req).method = HttpMethod::Get; } else if header_str.starts_with("POST ") { (*req).method = HttpMethod::Post; } else if header_str.starts_with("DELETE ") { (*req).method = HttpMethod::Delete; } else if header_str.starts_with("OPTIONS ") { (*req).method = HttpMethod::Options; } else { libc::free(req as *mut c_void); set_errmsg(errmsg, &MorlocError::Other("Unsupported HTTP method".into())); return ptr::null_mut(); } // Parse path let first_space = header_str.find(' ').unwrap_or(0) + 1; let path_end = header_str[first_space..].find(' ').map(|p| first_space + p).unwrap_or(first_space); let path = &header_str[first_space..path_end]; // Strip query string let path = path.split('?').next().unwrap_or(path); let path_len = path.len().min(255); ptr::copy_nonoverlapping(path.as_ptr(), (*req).path.as_mut_ptr() as *mut u8, path_len); (*req).path[path_len] = 0; // Find Content-Length let mut content_length: usize = 0; let header_lower = header_str.to_ascii_lowercase(); if let Some(pos) = header_lower.find("content-length:") { let after = &header_str[pos + 15..]; let trimmed = after.trim_start(); if let Some(end) = trimmed.find(|c: char| !c.is_ascii_digit()) { content_length = trimmed[..end].parse().unwrap_or(0); } else { content_length = trimmed.parse().unwrap_or(0); } } // Read body if content_length > 0 { if content_length > HTTP_MAX_REQUEST { libc::free(req as *mut c_void); set_errmsg(errmsg, &MorlocError::Other(format!("HTTP body too large: {} bytes", content_length))); return ptr::null_mut(); } let body = libc::malloc(content_length + 1) as *mut u8; if body.is_null() { libc::free(req as *mut c_void); set_errmsg(errmsg, &MorlocError::Other("Failed to allocate HTTP body buffer".into())); return ptr::null_mut(); } // Some body bytes may 
be in header_buf after \r\n\r\n let after_headers = header_end + 4; let already_read = (header_len - after_headers).min(content_length); if already_read > 0 { ptr::copy_nonoverlapping(header_buf.as_ptr().add(after_headers), body, already_read); } let mut total = already_read; while total < content_length { let n = libc::recv(fd, body.add(total) as *mut c_void, content_length - total, 0); if n <= 0 { libc::free(body as *mut c_void); libc::free(req as *mut c_void); set_errmsg(errmsg, &MorlocError::Other("Connection closed while reading HTTP body".into())); return ptr::null_mut(); } total += n as usize; } *body.add(content_length) = 0; (*req).body = body as *mut c_char; (*req).body_len = content_length; } req } #[no_mangle] pub unsafe extern "C" fn http_free_request(req: *mut HttpRequest) { if req.is_null() { return; } if !(*req).body.is_null() { libc::free((*req).body as *mut c_void); } libc::free(req as *mut c_void); } // ── http_write_response ────────────────────────────────────────────────────── fn http_status_text(status: i32) -> &'static str { match status { 200 => "OK", 400 => "Bad Request", 404 => "Not Found", 405 => "Method Not Allowed", 500 => "Internal Server Error", _ => "Unknown", } } #[no_mangle] pub unsafe extern "C" fn http_write_response( fd: i32, status: i32, content_type: *const c_char, body: *const c_char, body_len: usize, ) -> bool { let ct = if content_type.is_null() { "application/json" } else { std::ffi::CStr::from_ptr(content_type).to_str().unwrap_or("application/json") }; let header = format!( "HTTP/1.1 {} {}\r\n\ Content-Type: {}\r\n\ Content-Length: {}\r\n\ Connection: close\r\n\ Access-Control-Allow-Origin: *\r\n\ Access-Control-Allow-Methods: GET, POST, OPTIONS\r\n\ Access-Control-Allow-Headers: Content-Type\r\n\ \r\n", status, http_status_text(status), ct, body_len ); let n = libc::send(fd, header.as_ptr() as *const c_void, header.len(), crate::utility::SEND_NOSIGNAL); if n < 0 { return false; } if !body.is_null() && body_len > 0 { let 
mut total: usize = 0; while total < body_len { let n = libc::send(fd, (body as *const u8).add(total) as *const c_void, body_len - total, crate::utility::SEND_NOSIGNAL); if n <= 0 { return false; } total += n as usize; } } true } // ── http_to_daemon_request ─────────────────────────────────────────────────── /// Extract a JSON string value after a key like "expr": "..." fn extract_json_string(body: &str, key: &str) -> Option { let search = format!("\"{}\"", key); let pos = body.find(&search)?; let after = &body[pos + search.len()..]; let after = after.trim_start(); let after = after.strip_prefix(':')?; let after = after.trim_start(); if !after.starts_with('"') { return None; } let after = &after[1..]; // skip opening quote let mut result = String::new(); let mut chars = after.chars(); loop { match chars.next() { Some('\\') => { if let Some(c) = chars.next() { result.push(c); } } Some('"') => break, Some(c) => result.push(c), None => break, } } Some(result) } #[no_mangle] pub unsafe extern "C" fn http_to_daemon_request( req: *mut HttpRequest, errmsg: *mut *mut c_char, ) -> *mut DaemonRequest { clear_errmsg(errmsg); let dreq = libc::calloc(1, std::mem::size_of::()) as *mut DaemonRequest; if dreq.is_null() { set_errmsg(errmsg, &MorlocError::Other("Failed to allocate daemon_request_t".into())); return ptr::null_mut(); } let path = std::ffi::CStr::from_ptr((*req).path.as_ptr()) .to_str().unwrap_or(""); let method = (*req).method; let body_str = if !(*req).body.is_null() && (*req).body_len > 0 { std::str::from_utf8(std::slice::from_raw_parts((*req).body as *const u8, (*req).body_len)) .unwrap_or("") } else { "" }; // GET /health if method == HttpMethod::Get && path == "/health" { (*dreq).method = DaemonMethod::Health; return dreq; } // GET /discover if method == HttpMethod::Get && path == "/discover" { (*dreq).method = DaemonMethod::Discover; return dreq; } // POST /eval if method == HttpMethod::Post && path == "/eval" { (*dreq).method = DaemonMethod::Eval; if let 
Some(expr) = extract_json_string(body_str, "expr") { (*dreq).expr = libc::strdup(expr.as_ptr() as *const c_char); // strdup from Rust string - need null terminated let c = std::ffi::CString::new(expr).unwrap_or_default(); (*dreq).expr = libc::strdup(c.as_ptr()); } if (*dreq).expr.is_null() { libc::free(dreq as *mut c_void); set_errmsg(errmsg, &MorlocError::Other("Missing 'expr' field in /eval request body".into())); return ptr::null_mut(); } return dreq; } // POST /typecheck if method == HttpMethod::Post && path == "/typecheck" { (*dreq).method = DaemonMethod::Typecheck; if let Some(expr) = extract_json_string(body_str, "expr") { let c = std::ffi::CString::new(expr).unwrap_or_default(); (*dreq).expr = libc::strdup(c.as_ptr()); } if (*dreq).expr.is_null() { libc::free(dreq as *mut c_void); set_errmsg(errmsg, &MorlocError::Other("Missing 'expr' field in /typecheck request body".into())); return ptr::null_mut(); } return dreq; } // POST /bind if method == HttpMethod::Post && path == "/bind" { (*dreq).method = DaemonMethod::Bind; if let Some(expr) = extract_json_string(body_str, "expr") { let c = std::ffi::CString::new(expr).unwrap_or_default(); (*dreq).expr = libc::strdup(c.as_ptr()); } if let Some(name) = extract_json_string(body_str, "name") { let c = std::ffi::CString::new(name).unwrap_or_default(); (*dreq).name = libc::strdup(c.as_ptr()); } if (*dreq).expr.is_null() { libc::free(dreq as *mut c_void); set_errmsg(errmsg, &MorlocError::Other("Missing 'expr' field in /bind request body".into())); return ptr::null_mut(); } return dreq; } // GET /bindings if method == HttpMethod::Get && path == "/bindings" { (*dreq).method = DaemonMethod::Bindings; return dreq; } // DELETE /bindings/ if method == HttpMethod::Delete && path.starts_with("/bindings/") { let name = &path[10..]; if name.is_empty() { libc::free(dreq as *mut c_void); set_errmsg(errmsg, &MorlocError::Other("Missing binding name in /bindings/ path".into())); return ptr::null_mut(); } (*dreq).method = 
DaemonMethod::Unbind; let c = std::ffi::CString::new(name).unwrap_or_default(); (*dreq).name = libc::strdup(c.as_ptr()); return dreq; } // POST /call/ if method == HttpMethod::Post && path.starts_with("/call/") { let cmd_name = &path[6..]; if cmd_name.is_empty() { libc::free(dreq as *mut c_void); set_errmsg(errmsg, &MorlocError::Other("Missing command name in /call/ path".into())); return ptr::null_mut(); } (*dreq).method = DaemonMethod::Call; let c = std::ffi::CString::new(cmd_name).unwrap_or_default(); (*dreq).command = libc::strdup(c.as_ptr()); // Parse body let trimmed = body_str.trim(); if trimmed.starts_with('[') { let c = std::ffi::CString::new(trimmed).unwrap_or_default(); (*dreq).args_json = libc::strdup(c.as_ptr()); } else if trimmed.starts_with('{') { // Extract "args" array if let Some(args_pos) = trimmed.find("\"args\"") { let after = &trimmed[args_pos + 6..]; let after = after.trim_start().strip_prefix(':').unwrap_or(after).trim_start(); if after.starts_with('[') { // Find matching ] let mut depth = 0i32; let mut in_string = false; let mut end = 0; for (i, ch) in after.chars().enumerate() { if in_string { if ch == '\\' { continue; } if ch == '"' { in_string = false; } } else { if ch == '"' { in_string = true; } else if ch == '[' { depth += 1; } else if ch == ']' { depth -= 1; if depth == 0 { end = i + 1; break; } } } } if end > 0 { let arr = &after[..end]; let c = std::ffi::CString::new(arr).unwrap_or_default(); (*dreq).args_json = libc::strdup(c.as_ptr()); } } } } return dreq; } // OPTIONS (CORS preflight) if method == HttpMethod::Options { (*dreq).method = DaemonMethod::Health; return dreq; } libc::free(dreq as *mut c_void); let method_str = match method { HttpMethod::Get => "GET", HttpMethod::Post => "POST", HttpMethod::Delete => "DELETE", HttpMethod::Options => "OPTIONS", }; set_errmsg(errmsg, &MorlocError::Other(format!("Unknown HTTP endpoint: {} {}", method_str, path))); ptr::null_mut() } ================================================ FILE: 
data/rust/morloc-runtime/src/intrinsics.rs
================================================
//! Intrinsic functions for morloc: save/load/show/read/hash.
//! Replaces intrinsics.c. These are thin wrappers around serialization functions.

use std::ffi::{c_char, c_void, CStr, CString};
use std::ptr;

use crate::cschema::CSchema;
use crate::error::{clear_errmsg, set_errmsg, MorlocError};

// ── mlc_save: serialize to msgpack file ────────────────────────────────────

// Serialize voidstar `data` (layout described by `schema`) to MessagePack and
// write it atomically to `path`. Returns 0 on success; on failure returns 1
// with ownership of the inner error message transferred to *errmsg.
// pack_with_schema and write_atomic are resolved at link time from the other
// runtime translation units.
#[no_mangle]
pub unsafe extern "C" fn mlc_save(
    data: *const c_void,
    schema: *const CSchema,
    path: *const c_char,
    errmsg: *mut *mut c_char,
) -> i32 {
    clear_errmsg(errmsg);
    extern "C" {
        fn pack_with_schema(
            mlc: *const c_void,
            schema: *const CSchema,
            mpk: *mut *mut c_char,
            mpk_size: *mut usize,
            errmsg: *mut *mut c_char,
        ) -> i32;
        fn write_atomic(
            filename: *const c_char,
            data: *const u8,
            size: usize,
            errmsg: *mut *mut c_char,
        ) -> i32;
    }
    let mut err: *mut c_char = ptr::null_mut();
    let mut mpk: *mut c_char = ptr::null_mut();
    let mut mpk_size: usize = 0;
    let rc = pack_with_schema(data, schema, &mut mpk, &mut mpk_size, &mut err);
    if rc != 0 {
        // Propagate the callee's malloc'd message to the caller.
        *errmsg = err;
        return 1;
    }
    let wrc = write_atomic(path, mpk as *const u8, mpk_size, &mut err);
    // The packed buffer is malloc'd by pack_with_schema; free it either way.
    libc::free(mpk as *mut c_void);
    if wrc != 0 {
        *errmsg = err;
        return 1;
    }
    0
}

// ── mlc_save_json: serialize to JSON file ──────────────────────────────────

// Serialize voidstar `data` to a JSON string (via the C-side
// voidstar_to_json_string) and write it atomically to `path`.
// Returns 0 on success, 1 on failure with *errmsg set.
#[no_mangle]
pub unsafe extern "C" fn mlc_save_json(
    data: *const c_void,
    schema: *const CSchema,
    path: *const c_char,
    errmsg: *mut *mut c_char,
) -> i32 {
    clear_errmsg(errmsg);
    extern "C" {
        fn voidstar_to_json_string(
            data: *const c_void,
            schema: *const CSchema,
            errmsg: *mut *mut c_char,
        ) -> *mut c_char;
        fn write_atomic(
            filename: *const c_char,
            data: *const u8,
            size: usize,
            errmsg: *mut *mut c_char,
        ) -> i32;
    }
    let mut err: *mut c_char = ptr::null_mut();
    let json = voidstar_to_json_string(data, schema, &mut err);
    if json.is_null() {
        *errmsg = err;
        return 1;
    }
    let json_len = libc::strlen(json);
    let wrc = write_atomic(path, json as *const u8, json_len, &mut err);
    libc::free(json as *mut c_void);
    if wrc != 0 {
        *errmsg = err;
        return 1;
    }
    0
}

// ── mlc_save_voidstar: serialize to binary voidstar file ───────────────────

// NOTE(review): this function is truncated at the end of the visible chunk;
// the text below is preserved exactly as extracted.
#[no_mangle]
pub unsafe extern "C" fn mlc_save_voidstar(
    data: *const c_void,
    schema: *const CSchema,
    path: *const c_char,
    errmsg: *mut *mut c_char,
) -> i32 {
    clear_errmsg(errmsg);
    extern "C" {
        fn flatten_voidstar_to_buffer(
            data: *const c_void,
            schema: *const CSchema,
            out_buf: *mut *mut u8,
            out_size: *mut usize,
            errmsg: *mut *mut c_char,
        ) -> i32;
        fn write_binary_fd(
            fd: i32,
            buf: *const c_char,
            count: usize,
            errmsg: *mut *mut c_char,
        ) -> i32;
    }
    let mut err: *mut c_char = ptr::null_mut();
    // Get directory for temp file
    let path_str = CStr::from_ptr(path).to_string_lossy();
    let parent = std::path::Path::new(path_str.as_ref()).parent();
    let dir = match parent {
        Some(p) if !p.as_os_str().is_empty() => p.to_string_lossy().into_owned(),
        _ => ".".to_string(),
    };
    let tmp_template = format!("{}/morloc-tmp_XXXXXX\0", dir);
    let mut tmp_buf: Vec = tmp_template.into_bytes();
    let fd = libc::mkstemp(tmp_buf.as_mut_ptr() as *mut c_char);
    if fd < 0 {
        set_errmsg(errmsg, &MorlocError::Io(std::io::Error::last_os_error()));
        return 1;
    }
    // Write packet header placeholder
    let header_size = std::mem::size_of::();
    let zeros = vec![0u8; header_size];
    if write_binary_fd(fd, zeros.as_ptr() as *const c_char, header_size, &mut err) != 0 {
        libc::close(fd);
        libc::unlink(tmp_buf.as_ptr() as *const c_char);
        *errmsg = err;
        return 1;
    }
    // Flatten voidstar
    let mut blob: *mut u8 = ptr::null_mut();
    let mut blob_size: usize = 0;
    if flatten_voidstar_to_buffer(data, schema, &mut blob, &mut blob_size, &mut err) != 0 {
        libc::close(fd);
        libc::unlink(tmp_buf.as_ptr() as *const c_char);
        *errmsg = err;
        return 1;
    }
    // Write flattened data
    if write_binary_fd(fd, blob as *const c_char, blob_size, &mut err) != 0 {
        libc::free(blob as *mut c_void);
        libc::close(fd);
        libc::unlink(tmp_buf.as_ptr() as *const c_char);
        *errmsg
= err; return 1; } libc::free(blob as *mut c_void); // Seek back and write real header libc::lseek(fd, 0, libc::SEEK_SET); let header = crate::packet::PacketHeader::data_mesg( crate::packet::PACKET_FORMAT_VOIDSTAR, blob_size as u64, ); let hdr_bytes = header.to_bytes(); write_binary_fd(fd, hdr_bytes.as_ptr() as *const c_char, hdr_bytes.len(), &mut err); libc::fsync(fd); libc::close(fd); // Atomic rename if libc::rename(tmp_buf.as_ptr() as *const c_char, path) != 0 { libc::unlink(tmp_buf.as_ptr() as *const c_char); set_errmsg(errmsg, &MorlocError::Io(std::io::Error::last_os_error())); return 1; } 0 } // ── mlc_load: load from file (auto-detect format) ───────────────────────── #[no_mangle] pub unsafe extern "C" fn mlc_load( path: *const c_char, schema: *const CSchema, errmsg: *mut *mut c_char, ) -> *mut c_void { clear_errmsg(errmsg); extern "C" { fn file_exists(filename: *const c_char) -> bool; fn read_binary_file( filename: *const c_char, file_size: *mut usize, errmsg: *mut *mut c_char, ) -> *mut u8; fn load_morloc_data_file( path: *const c_char, data: *mut u8, data_size: usize, schema: *const CSchema, errmsg: *mut *mut c_char, ) -> *mut c_void; } if !file_exists(path) { return ptr::null_mut(); } let mut err: *mut c_char = ptr::null_mut(); let mut file_size: usize = 0; let data = read_binary_file(path, &mut file_size, &mut err); if data.is_null() { if !err.is_null() { let path_str = CStr::from_ptr(path).to_string_lossy(); let err_str = CStr::from_ptr(err).to_string_lossy(); eprintln!("@load warning ({}): {}", path_str, err_str); libc::free(err as *mut libc::c_void); } return ptr::null_mut(); } let result = load_morloc_data_file(path, data, file_size, schema, &mut err); if result.is_null() && !err.is_null() { let path_str = CStr::from_ptr(path).to_string_lossy(); let err_str = CStr::from_ptr(err).to_string_lossy(); eprintln!("@load warning ({}): {}", path_str, err_str); libc::free(err as *mut libc::c_void); } result } // ── mlc_hash: hash voidstar data 
─────────────────────────────────────────── #[no_mangle] pub unsafe extern "C" fn mlc_hash( data: *const c_void, schema: *const CSchema, errmsg: *mut *mut c_char, ) -> *mut c_char { clear_errmsg(errmsg); let mut err: *mut c_char = ptr::null_mut(); let hash = crate::cache::hash_voidstar(data, schema, 0, &mut err); if !err.is_null() { *errmsg = err; return ptr::null_mut(); } let hex = format!("{:016x}", hash); match CString::new(hex) { Ok(cs) => cs.into_raw(), Err(_) => { set_errmsg(errmsg, &MorlocError::Other("CString error".into())); ptr::null_mut() } } } // ── mlc_show: serialize to JSON string ───────────────────────────────────── #[no_mangle] pub unsafe extern "C" fn mlc_show( data: *const c_void, schema: *const CSchema, errmsg: *mut *mut c_char, ) -> *mut c_char { clear_errmsg(errmsg); extern "C" { fn voidstar_to_json_string( data: *const c_void, schema: *const CSchema, errmsg: *mut *mut c_char, ) -> *mut c_char; } voidstar_to_json_string(data, schema, errmsg) } // ── mlc_read: deserialize from JSON string ───────────────────────────────── #[no_mangle] pub unsafe extern "C" fn mlc_read( json_str: *const c_char, schema: *const CSchema, errmsg: *mut *mut c_char, ) -> *mut c_void { clear_errmsg(errmsg); extern "C" { fn read_json_with_schema( dest: *mut u8, json: *mut c_char, schema: *const CSchema, errmsg: *mut *mut c_char, ) -> *mut u8; } let json_copy = libc::strdup(json_str); if json_copy.is_null() { set_errmsg(errmsg, &MorlocError::Other("strdup failed".into())); return ptr::null_mut(); } let mut err: *mut c_char = ptr::null_mut(); let result = read_json_with_schema(ptr::null_mut(), json_copy, schema, &mut err); libc::free(json_copy as *mut c_void); if result.is_null() { if !err.is_null() { libc::free(err as *mut c_void); } } result as *mut c_void } // write_voidstar_binary is provided by packet.c (still C) // It will be ported when packet.c is ported to Rust. 
// Unused Rust implementation kept for future use #[allow(dead_code)] unsafe fn _write_voidstar_binary_rust( fd: i32, data: *const c_void, schema: *const CSchema, errmsg: *mut *mut c_char, ) -> isize { clear_errmsg(errmsg); extern "C" { fn flatten_voidstar_to_buffer( data: *const c_void, schema: *const CSchema, out_buf: *mut *mut u8, out_size: *mut usize, errmsg: *mut *mut c_char, ) -> i32; fn write_binary_fd( fd: i32, buf: *const c_char, count: usize, errmsg: *mut *mut c_char, ) -> i32; } let mut err: *mut c_char = ptr::null_mut(); let mut blob: *mut u8 = ptr::null_mut(); let mut blob_size: usize = 0; if flatten_voidstar_to_buffer(data, schema, &mut blob, &mut blob_size, &mut err) != 0 { *errmsg = err; return -1; } if write_binary_fd(fd, blob as *const c_char, blob_size, &mut err) != 0 { libc::free(blob as *mut c_void); *errmsg = err; return -1; } libc::free(blob as *mut c_void); blob_size as isize } ================================================ FILE: data/rust/morloc-runtime/src/ipc.rs ================================================ //! Unix domain socket IPC for communication between nexus and language pools. //! Replaces ipc.c. use crate::error::MorlocError; use crate::packet::PacketHeader; use std::io::{Read, Write}; use std::os::unix::net::UnixStream; use std::path::Path; /// Send a packet (header + payload) over a Unix stream socket and receive the response. 
pub fn send_and_receive( socket_path: &Path, header: &PacketHeader, payload: &[u8], ) -> Result<(PacketHeader, Vec), MorlocError> { let mut stream = UnixStream::connect(socket_path).map_err(|e| { MorlocError::Ipc(format!( "failed to connect to {}: {e}", socket_path.display() )) })?; // Send header let header_bytes = header.to_bytes(); stream .write_all(&header_bytes) .map_err(|e| MorlocError::Ipc(format!("failed to send header: {e}")))?; // Send payload if !payload.is_empty() { stream .write_all(payload) .map_err(|e| MorlocError::Ipc(format!("failed to send payload: {e}")))?; } // Read response header let mut resp_header_bytes = [0u8; 32]; stream .read_exact(&mut resp_header_bytes) .map_err(|e| MorlocError::Ipc(format!("failed to read response header: {e}")))?; let resp_header = PacketHeader::from_bytes(&resp_header_bytes)?; // Read response payload let payload_len = resp_header.length as usize; let mut resp_payload = vec![0u8; payload_len]; if payload_len > 0 { stream .read_exact(&mut resp_payload) .map_err(|e| MorlocError::Ipc(format!("failed to read response payload: {e}")))?; } Ok((resp_header, resp_payload)) } /// Read a single packet from a connected stream. 
pub fn read_packet(stream: &mut UnixStream) -> Result<(PacketHeader, Vec), MorlocError> { let mut header_bytes = [0u8; 32]; stream .read_exact(&mut header_bytes) .map_err(|e| MorlocError::Ipc(format!("failed to read packet header: {e}")))?; let header = PacketHeader::from_bytes(&header_bytes)?; // Skip metadata between header and payload let skip = header.offset as usize - 32; if skip > 0 { let mut discard = vec![0u8; skip]; stream .read_exact(&mut discard) .map_err(|e| MorlocError::Ipc(format!("failed to skip metadata: {e}")))?; } let payload_len = header.length as usize; let mut payload = vec![0u8; payload_len]; if payload_len > 0 { stream .read_exact(&mut payload) .map_err(|e| MorlocError::Ipc(format!("failed to read payload: {e}")))?; } Ok((header, payload)) } /// Send a packet over a connected stream. pub fn send_packet( stream: &mut UnixStream, header: &PacketHeader, payload: &[u8], ) -> Result<(), MorlocError> { let header_bytes = header.to_bytes(); stream .write_all(&header_bytes) .map_err(|e| MorlocError::Ipc(format!("failed to send header: {e}")))?; if !payload.is_empty() { stream .write_all(payload) .map_err(|e| MorlocError::Ipc(format!("failed to send payload: {e}")))?; } Ok(()) } ================================================ FILE: data/rust/morloc-runtime/src/ipc_ffi.rs ================================================ //! C ABI wrappers for IPC functions. //! Replaces ipc.c with Rust implementations of Unix domain socket operations. use std::ffi::{c_char, c_void, CStr}; use std::ptr; use crate::error::{clear_errmsg, set_errmsg, MorlocError}; // ── C types from call.h ────────────────────────────────────────────────────── #[repr(C)] pub struct ClientList { pub fd: i32, pub next: *mut ClientList, } // language_daemon_t has fd_set which is 128 bytes on Linux. // We represent it as an opaque struct and use libc calls. 
#[repr(C)] pub struct LanguageDaemon { pub socket_path: *mut c_char, pub tmpdir: *mut c_char, pub shm_basename: *mut c_char, pub shm: *mut crate::shm::ShmHeader, pub shm_default_size: usize, pub server_fd: i32, pub read_fds: libc::fd_set, pub client_fds: *mut ClientList, } const BUFFER_SIZE: usize = 65536; // ── close_socket / close_daemon ────────────────────────────────────────────── #[no_mangle] pub unsafe extern "C" fn close_socket(socket_id: i32) { if socket_id >= 0 { libc::close(socket_id); } } #[no_mangle] pub unsafe extern "C" fn close_daemon(daemon_ptr: *mut *mut LanguageDaemon) { if daemon_ptr.is_null() || (*daemon_ptr).is_null() { return; } let daemon = *daemon_ptr; close_socket((*daemon).server_fd); // Free client list let mut current = (*daemon).client_fds; while !current.is_null() { let next = (*current).next; libc::close((*current).fd); libc::free(current as *mut c_void); current = next; } if !(*daemon).socket_path.is_null() { libc::unlink((*daemon).socket_path); libc::free((*daemon).socket_path as *mut c_void); } if !(*daemon).tmpdir.is_null() { libc::free((*daemon).tmpdir as *mut c_void); } if !(*daemon).shm_basename.is_null() { libc::free((*daemon).shm_basename as *mut c_void); } libc::free(daemon as *mut c_void); *daemon_ptr = ptr::null_mut(); } // ── Socket helpers ─────────────────────────────────────────────────────────── unsafe fn new_socket(errmsg: *mut *mut c_char) -> i32 { clear_errmsg(errmsg); let fd = libc::socket(libc::AF_UNIX, libc::SOCK_STREAM, 0); if fd < 0 { set_errmsg(errmsg, &MorlocError::Ipc("Error creating socket".into())); return -1; } crate::utility::set_nosigpipe(fd); fd } unsafe fn new_server_addr(socket_path: *const c_char) -> libc::sockaddr_un { let mut addr: libc::sockaddr_un = std::mem::zeroed(); addr.sun_family = libc::AF_UNIX as libc::sa_family_t; let path_bytes = CStr::from_ptr(socket_path).to_bytes(); let copy_len = path_bytes.len().min(addr.sun_path.len() - 1); ptr::copy_nonoverlapping( path_bytes.as_ptr() as *const 
c_char, addr.sun_path.as_mut_ptr(), copy_len, ); addr } unsafe fn new_server(socket_path: *const c_char, errmsg: *mut *mut c_char) -> i32 { let server_fd = new_socket(errmsg); if server_fd < 0 { return -1; } let addr = new_server_addr(socket_path); // Remove any existing socket file libc::unlink(socket_path); if libc::bind(server_fd, &addr as *const libc::sockaddr_un as *const libc::sockaddr, std::mem::size_of::() as u32) < 0 { close_socket(server_fd); set_errmsg(errmsg, &MorlocError::Ipc("Error binding socket".into())); return -1; } if libc::listen(server_fd, 16) < 0 { close_socket(server_fd); set_errmsg(errmsg, &MorlocError::Ipc("Error listening on socket".into())); return -1; } server_fd } // ── start_daemon ───────────────────────────────────────────────────────────── #[no_mangle] pub unsafe extern "C" fn start_daemon( socket_path: *const c_char, tmpdir: *const c_char, shm_basename: *const c_char, shm_default_size: usize, errmsg: *mut *mut c_char, ) -> *mut LanguageDaemon { clear_errmsg(errmsg); let daemon = libc::calloc(1, std::mem::size_of::()) as *mut LanguageDaemon; if daemon.is_null() { set_errmsg(errmsg, &MorlocError::Ipc("Calloc for language_daemon_t failed".into())); return ptr::null_mut(); } (*daemon).server_fd = -1; (*daemon).socket_path = libc::strdup(socket_path); (*daemon).tmpdir = libc::strdup(tmpdir); (*daemon).shm_basename = libc::strdup(shm_basename); if (*daemon).socket_path.is_null() || (*daemon).tmpdir.is_null() || (*daemon).shm_basename.is_null() { close_daemon(&mut (daemon as *mut LanguageDaemon)); set_errmsg(errmsg, &MorlocError::Ipc("strdup failed in start_daemon".into())); return ptr::null_mut(); } (*daemon).shm_default_size = shm_default_size; (*daemon).client_fds = ptr::null_mut(); libc::FD_ZERO(&mut (*daemon).read_fds); // Set fallback dir for file-backed SHM crate::shm::shm_set_fallback_dir(&CStr::from_ptr(tmpdir).to_string_lossy()); // Init shared memory let mut err: *mut c_char = ptr::null_mut(); let shm = 
crate::ffi::shinit(shm_basename, 0, shm_default_size, &mut err); if !err.is_null() { close_daemon(&mut (daemon as *mut LanguageDaemon)); *errmsg = err; return ptr::null_mut(); } (*daemon).shm = shm; // Create server socket (*daemon).server_fd = new_server(socket_path, &mut err); if !err.is_null() { close_daemon(&mut (daemon as *mut LanguageDaemon)); *errmsg = err; return ptr::null_mut(); } // Set non-blocking mode let flags = libc::fcntl((*daemon).server_fd, libc::F_GETFL); if flags == -1 || libc::fcntl((*daemon).server_fd, libc::F_SETFL, flags | libc::O_NONBLOCK) == -1 { let errno_msg = std::ffi::CStr::from_ptr(libc::strerror(crate::utility::errno_val())) .to_string_lossy().into_owned(); close_daemon(&mut (daemon as *mut LanguageDaemon)); set_errmsg(errmsg, &MorlocError::Ipc(format!("Failed to set non-blocking mode: {}", errno_msg))); return ptr::null_mut(); } daemon } // ── stream_from_client_wait ────────────────────────────────────────────────── #[no_mangle] pub unsafe extern "C" fn stream_from_client_wait( client_fd: i32, pselect_timeout_us: i32, recv_timeout_us: i32, errmsg: *mut *mut c_char, ) -> *mut u8 { clear_errmsg(errmsg); if libc::fcntl(client_fd, libc::F_GETFD) == -1 { set_errmsg(errmsg, &MorlocError::Ipc("Invalid file descriptor".into())); return ptr::null_mut(); } let buffer = libc::calloc(BUFFER_SIZE, 1) as *mut u8; if buffer.is_null() { set_errmsg(errmsg, &MorlocError::Ipc("calloc failed for buffer".into())); return ptr::null_mut(); } let mut read_fds: libc::fd_set = std::mem::zeroed(); let max_fd = client_fd; // Timeout setup let mut ts_loop: libc::timespec = std::mem::zeroed(); let timeout_ptr = if pselect_timeout_us > 0 { ts_loop.tv_sec = (pselect_timeout_us / 1000000) as i64; ts_loop.tv_nsec = ((pselect_timeout_us % 1000000) * 1000) as i64; &ts_loop as *const libc::timespec } else { ptr::null() }; // Signal mask setup let mut mask: libc::sigset_t = std::mem::zeroed(); let mut origmask: libc::sigset_t = std::mem::zeroed(); 
libc::sigemptyset(&mut mask); libc::sigaddset(&mut mask, libc::SIGINT); libc::pthread_sigmask(libc::SIG_SETMASK, &mask, &mut origmask); // Initial receive with timeout let mut ready; loop { libc::FD_ZERO(&mut read_fds); libc::FD_SET(client_fd, &mut read_fds); ready = libc::pselect(max_fd + 1, &mut read_fds, ptr::null_mut(), ptr::null_mut(), timeout_ptr, &origmask); if !(ready < 0 && crate::utility::errno_val() == libc::EINTR) { break; } } libc::pthread_sigmask(libc::SIG_SETMASK, &origmask, ptr::null_mut()); if ready == 0 { libc::free(buffer as *mut c_void); set_errmsg(errmsg, &MorlocError::Ipc("Timeout waiting for initial data".into())); return ptr::null_mut(); } if ready < 0 { libc::free(buffer as *mut c_void); set_errmsg(errmsg, &MorlocError::Ipc("pselect error".into())); return ptr::null_mut(); } if !libc::FD_ISSET(client_fd, &read_fds) { libc::free(buffer as *mut c_void); set_errmsg(errmsg, &MorlocError::Ipc("Bad client file descriptor".into())); return ptr::null_mut(); } let recv_length = libc::recv(client_fd, buffer as *mut c_void, BUFFER_SIZE, 0); if recv_length == 0 { libc::free(buffer as *mut c_void); set_errmsg(errmsg, &MorlocError::Ipc("Connection closed by peer".into())); return ptr::null_mut(); } if recv_length < 0 && crate::utility::errno_val() != libc::EWOULDBLOCK && crate::utility::errno_val() != libc::EAGAIN { libc::free(buffer as *mut c_void); set_errmsg(errmsg, &MorlocError::Ipc("Recv error".into())); return ptr::null_mut(); } // Get packet size from header let mut packet_err: *mut c_char = ptr::null_mut(); let packet_length = crate::packet_ffi::morloc_packet_size(buffer, &mut packet_err); if !packet_err.is_null() { libc::free(buffer as *mut c_void); *errmsg = packet_err; return ptr::null_mut(); } let result = libc::calloc(packet_length, 1) as *mut u8; if result.is_null() { libc::free(buffer as *mut c_void); set_errmsg(errmsg, &MorlocError::Ipc("calloc failure".into())); return ptr::null_mut(); } let copy_length = (recv_length as 
usize).min(packet_length); ptr::copy_nonoverlapping(buffer, result, copy_length); let mut data_ptr = result.add(copy_length); libc::free(buffer as *mut c_void); let attempts = 10; while (data_ptr as usize - result as usize) < packet_length { let mut packet_received = false; for attempt in 0..attempts { libc::FD_ZERO(&mut read_fds); libc::FD_SET(client_fd, &mut read_fds); let recv_timeout_ptr = if recv_timeout_us > 0 { let total_us = recv_timeout_us as i64 * (attempt as i64 + 1); ts_loop.tv_sec = total_us / 1000000; ts_loop.tv_nsec = (total_us % 1000000) * 1000; &ts_loop as *const libc::timespec } else { ptr::null() }; libc::pthread_sigmask(libc::SIG_SETMASK, &mask, ptr::null_mut()); ready = libc::pselect(max_fd + 1, &mut read_fds, ptr::null_mut(), ptr::null_mut(), recv_timeout_ptr, &origmask); libc::pthread_sigmask(libc::SIG_SETMASK, &origmask, ptr::null_mut()); if ready == 0 { libc::free(result as *mut c_void); set_errmsg(errmsg, &MorlocError::Ipc("Timeout waiting for remaining data".into())); return ptr::null_mut(); } if ready < 0 && crate::utility::errno_val() != libc::EINTR { libc::free(result as *mut c_void); set_errmsg(errmsg, &MorlocError::Ipc("pselect error".into())); return ptr::null_mut(); } if ready <= 0 { continue; } if libc::FD_ISSET(client_fd, &read_fds) { let remaining = packet_length - (data_ptr as usize - result as usize); let recv_size = remaining.min(BUFFER_SIZE); let n = libc::recv(client_fd, data_ptr as *mut c_void, recv_size, 0); if n > 0 { data_ptr = data_ptr.add(n as usize); packet_received = true; break; } if n == 0 { libc::free(result as *mut c_void); set_errmsg(errmsg, &MorlocError::Ipc("Connection closed early".into())); return ptr::null_mut(); } if n < 0 && crate::utility::errno_val() != libc::EWOULDBLOCK && crate::utility::errno_val() != libc::EAGAIN { libc::free(result as *mut c_void); set_errmsg(errmsg, &MorlocError::Ipc("Recv error".into())); return ptr::null_mut(); } } } if !packet_received { libc::free(result as *mut c_void); 
set_errmsg(errmsg, &MorlocError::Ipc("Failed to retrieve packet".into())); return ptr::null_mut(); } } result } #[no_mangle] pub unsafe extern "C" fn stream_from_client( client_fd: i32, errmsg: *mut *mut c_char, ) -> *mut u8 { stream_from_client_wait(client_fd, 0, 0, errmsg) } // ── send_and_receive_over_socket ───────────────────────────────────────────── #[no_mangle] pub unsafe extern "C" fn send_and_receive_over_socket_wait( socket_path: *const c_char, packet: *const u8, pselect_timeout_us: i32, recv_timeout_us: i32, errmsg: *mut *mut c_char, ) -> *mut u8 { clear_errmsg(errmsg); let mut err: *mut c_char = ptr::null_mut(); let client_fd = new_socket(&mut err); if client_fd < 0 { *errmsg = err; return ptr::null_mut(); } let addr = new_server_addr(socket_path); // Connect with retry (matching C WAIT macro behavior) let mut retcode; let mut attempts = 0; loop { retcode = libc::connect(client_fd, &addr as *const libc::sockaddr_un as *const libc::sockaddr, std::mem::size_of::() as u32); if retcode == 0 { break; } attempts += 1; if attempts > 300 { // ~30 seconds with 100ms sleep close_socket(client_fd); set_errmsg(errmsg, &MorlocError::Ipc(format!( "Failed to connect to pipe '{}'", CStr::from_ptr(socket_path).to_string_lossy() ))); return ptr::null_mut(); } libc::usleep(100_000); // 100ms } let packet_size = crate::packet_ffi::morloc_packet_size(packet, &mut err); if !err.is_null() { close_socket(client_fd); *errmsg = err; return ptr::null_mut(); } // Send packet in loop let mut total_sent: usize = 0; while total_sent < packet_size { let bytes_sent = libc::send( client_fd, packet.add(total_sent) as *const c_void, packet_size - total_sent, crate::utility::SEND_NOSIGNAL, ); if bytes_sent <= 0 { close_socket(client_fd); set_errmsg(errmsg, &MorlocError::Ipc(format!( "Failed to send data to '{}'", CStr::from_ptr(socket_path).to_string_lossy() ))); return ptr::null_mut(); } total_sent += bytes_sent as usize; } let result = stream_from_client_wait(client_fd, 
pselect_timeout_us, recv_timeout_us, &mut err); if !err.is_null() { close_socket(client_fd); *errmsg = err; return ptr::null_mut(); } close_socket(client_fd); result } #[no_mangle] pub unsafe extern "C" fn send_and_receive_over_socket( socket_path: *const c_char, packet: *const u8, errmsg: *mut *mut c_char, ) -> *mut u8 { send_and_receive_over_socket_wait(socket_path, packet, 0, 0, errmsg) } // ── send_packet_to_foreign_server ──────────────────────────────────────────── #[no_mangle] pub unsafe extern "C" fn send_packet_to_foreign_server( client_fd: i32, packet: *mut u8, errmsg: *mut *mut c_char, ) -> usize { clear_errmsg(errmsg); let mut err: *mut c_char = ptr::null_mut(); let size = crate::packet_ffi::morloc_packet_size(packet, &mut err); if !err.is_null() { *errmsg = err; return 0; } let mut total_sent: usize = 0; while total_sent < size { let bytes_sent = libc::send( client_fd, packet.add(total_sent) as *const c_void, size - total_sent, crate::utility::SEND_NOSIGNAL, ); if bytes_sent <= 0 { set_errmsg(errmsg, &MorlocError::Ipc(format!( "Failed to send over client {}", client_fd ))); return 0; } total_sent += bytes_sent as usize; } total_sent } // ── wait_for_client ────────────────────────────────────────────────────────── #[no_mangle] pub unsafe extern "C" fn wait_for_client_with_timeout( daemon: *mut LanguageDaemon, timeout_us: i32, errmsg: *mut *mut c_char, ) -> i32 { clear_errmsg(errmsg); libc::FD_ZERO(&mut (*daemon).read_fds); libc::FD_SET((*daemon).server_fd, &mut (*daemon).read_fds); let mut max_fd = (*daemon).server_fd; // Add existing client fds let mut client = (*daemon).client_fds; while !client.is_null() { libc::FD_SET((*client).fd, &mut (*daemon).read_fds); if (*client).fd > max_fd { max_fd = (*client).fd; } client = (*client).next; } // Timeout let mut ts: libc::timespec = std::mem::zeroed(); let timeout_ptr = if timeout_us > 0 { ts.tv_sec = (timeout_us / 1000000) as i64; ts.tv_nsec = ((timeout_us % 1000000) * 1000) as i64; &ts as *const 
libc::timespec } else { ptr::null() }; let mut emptymask: libc::sigset_t = std::mem::zeroed(); libc::sigemptyset(&mut emptymask); let ready = libc::pselect(max_fd + 1, &mut (*daemon).read_fds, ptr::null_mut(), ptr::null_mut(), timeout_ptr, &emptymask); if ready < 0 { if crate::utility::errno_val() == libc::EINTR { return 0; } set_errmsg(errmsg, &MorlocError::Ipc("pselect error".into())); return -1; } if ready == 0 { return 0; } // Check for new connection if libc::FD_ISSET((*daemon).server_fd, &(*daemon).read_fds) { let selected_fd = libc::accept((*daemon).server_fd, ptr::null_mut(), ptr::null_mut()); if selected_fd >= 0 { crate::utility::set_nosigpipe(selected_fd); libc::fcntl(selected_fd, libc::F_SETFL, libc::O_NONBLOCK); let new_client = libc::calloc(1, std::mem::size_of::()) as *mut ClientList; (*new_client).fd = selected_fd; (*new_client).next = ptr::null_mut(); if (*daemon).client_fds.is_null() { (*daemon).client_fds = new_client; } else { let mut last = (*daemon).client_fds; while !(*last).next.is_null() { last = (*last).next; } (*last).next = new_client; } } // Ignore EAGAIN/EWOULDBLOCK on accept } if (*daemon).client_fds.is_null() { return 0; // spurious wakeup } // Dequeue first client let client_node = (*daemon).client_fds; let return_fd = (*client_node).fd; (*daemon).client_fds = (*client_node).next; libc::free(client_node as *mut c_void); return_fd } #[no_mangle] pub unsafe extern "C" fn wait_for_client( daemon: *mut LanguageDaemon, errmsg: *mut *mut c_char, ) -> i32 { wait_for_client_with_timeout(daemon, 0, errmsg) } ================================================ FILE: data/rust/morloc-runtime/src/json.rs ================================================ //! JSON <-> Voidstar conversion. //! //! # Safety model //! //! All SHM pointer operations are encapsulated in `ShmWriter` (write) and //! `ShmReader` (read). Each has a single `unsafe fn new()` constructor; //! all subsequent reads/writes through the handle are safe methods. //! 
The only remaining `unsafe` blocks are `libc::snprintf` for float //! formatting and constructing readers/writers at known-valid offsets. use crate::error::MorlocError; use crate::schema::{Schema, SerialType}; use crate::shm::{self, AbsPtr, Array, RELNULL}; // ── Safe SHM abstractions ──────────────────────────────────────────────────── /// Write handle to a region of shared memory. /// /// # Safety invariant /// `ptr` was obtained from `shmalloc` and points to at least `len` writable bytes. struct ShmWriter { ptr: *mut u8, #[cfg(debug_assertions)] len: usize, } impl ShmWriter { /// # Safety /// `ptr` must point to `len` bytes of valid, writable SHM. unsafe fn new(ptr: *mut u8, len: usize) -> Self { let _ = len; ShmWriter { ptr, #[cfg(debug_assertions)] len } } fn as_ptr(&self) -> *mut u8 { self.ptr } fn write_bytes(&self, offset: usize, src: &[u8]) { debug_assert!(offset + src.len() <= { #[cfg(debug_assertions)] { self.len } #[cfg(not(debug_assertions))] { usize::MAX } }); unsafe { std::ptr::copy_nonoverlapping(src.as_ptr(), self.ptr.add(offset), src.len()); } } fn zero(&self, offset: usize, count: usize) { unsafe { std::ptr::write_bytes(self.ptr.add(offset), 0, count); } } fn write_val(&self, offset: usize, val: T) { unsafe { (self.ptr.add(offset) as *mut T).write_unaligned(val); } } fn write_array_header(&self, offset: usize, size: usize, data_rel: shm::RelPtr) { let arr = Array { size, data: data_rel }; unsafe { std::ptr::copy_nonoverlapping( &arr as *const Array as *const u8, self.ptr.add(offset), std::mem::size_of::(), ); } } fn sub(&self, offset: usize, sub_len: usize) -> ShmWriter { unsafe { ShmWriter::new(self.ptr.add(offset), sub_len) } } } /// Read handle to SHM data. /// /// # Safety invariant /// `ptr` was obtained from `rel2abs`/`shmalloc` and points to valid readable SHM. struct ShmReader { ptr: *const u8 } impl ShmReader { /// # Safety /// `ptr` must point to valid, readable shared memory. 
unsafe fn new(ptr: *const u8) -> Self { ShmReader { ptr } } fn read_val(&self, offset: usize) -> T { unsafe { (self.ptr.add(offset) as *const T).read_unaligned() } } fn read_u8(&self, offset: usize) -> u8 { self.read_val(offset) } fn read_array(&self, offset: usize) -> Array { unsafe { *(self.ptr.add(offset) as *const Array) } } fn read_str(&self, offset: usize, len: usize) -> &str { unsafe { std::str::from_utf8(std::slice::from_raw_parts(self.ptr.add(offset), len)).unwrap_or("") } } fn at(&self, offset: usize) -> ShmReader { unsafe { ShmReader::new(self.ptr.add(offset)) } } } // ── JSON -> Voidstar ─────────────────────────────────────────────────────── pub fn read_json_with_schema(json_str: &str, schema: &Schema) -> Result { read_json_with_schema_dest(None, json_str, schema) } pub fn read_json_with_schema_dest( dest: Option, json_str: &str, schema: &Schema, ) -> Result { let value: serde_json::Value = serde_json::from_str(json_str) .map_err(|e| MorlocError::Serialization(format!("JSON parse error: {}", e)))?; json_to_voidstar(&value, schema, dest) } fn alloc(dest: Option, size: usize) -> Result { let ptr = match dest { Some(p) => p, None => shm::shmalloc(size)? }; // SAFETY: ptr from shmalloc or caller-provided valid SHM of sufficient size Ok(unsafe { ShmWriter::new(ptr, size) }) } fn json_to_voidstar( value: &serde_json::Value, schema: &Schema, dest: Option, ) -> Result { match schema.serial_type { SerialType::Nil => { let w = alloc(dest, 1)?; w.write_val::(0, 0); Ok(w.as_ptr()) } SerialType::Bool => { let b = value.as_bool().ok_or_else(|| err("expected bool"))?; let w = alloc(dest, 1)?; w.write_val::(0, b as u8); Ok(w.as_ptr()) } SerialType::Sint8 => { let w = alloc(dest, 1)?; w.write_val::(0, as_i64(value)? as i8); Ok(w.as_ptr()) } SerialType::Sint16 => { let w = alloc(dest, 2)?; w.write_val::(0, as_i64(value)? as i16); Ok(w.as_ptr()) } SerialType::Sint32 => { let w = alloc(dest, 4)?; w.write_val::(0, as_i64(value)? 
as i32); Ok(w.as_ptr()) } SerialType::Sint64 => { let w = alloc(dest, 8)?; w.write_val::(0, as_i64(value)?); Ok(w.as_ptr()) } SerialType::Uint8 => { let w = alloc(dest, 1)?; w.write_val::(0, as_u64(value)? as u8); Ok(w.as_ptr()) } SerialType::Uint16 => { let w = alloc(dest, 2)?; w.write_val::(0, as_u64(value)? as u16); Ok(w.as_ptr()) } SerialType::Uint32 => { let w = alloc(dest, 4)?; w.write_val::(0, as_u64(value)? as u32); Ok(w.as_ptr()) } SerialType::Uint64 => { let w = alloc(dest, 8)?; w.write_val::(0, as_u64(value)?); Ok(w.as_ptr()) } SerialType::Float32 => { let w = alloc(dest, 4)?; w.write_val::(0, as_f64(value)? as f32); Ok(w.as_ptr()) } SerialType::Float64 => { let w = alloc(dest, 8)?; w.write_val::(0, as_f64(value)?); Ok(w.as_ptr()) } SerialType::String => { let s = value.as_str().ok_or_else(|| err("expected string"))?; let bytes = s.as_bytes(); let hdr = std::mem::size_of::(); let (w, data_rel) = if dest.is_some() { let w = alloc(dest, hdr)?; let data_rel = if bytes.is_empty() { RELNULL } else { shm::abs2rel(shm::shmemcpy(bytes.as_ptr(), bytes.len())?)? }; (w, data_rel) } else { let w = alloc(None, hdr + bytes.len())?; w.write_bytes(hdr, bytes); // SAFETY: data is hdr bytes into the same shmalloc block let data_rel = shm::abs2rel(unsafe { w.as_ptr().add(hdr) })?; (w, data_rel) }; w.write_array_header(0, bytes.len(), data_rel); Ok(w.as_ptr()) } SerialType::Array => { let arr_val = value.as_array().ok_or_else(|| err("expected array"))?; let es = schema.parameters.first().ok_or_else(|| err("array has no element type"))?; let n = arr_val.len(); let ew = es.width; let hdr = std::mem::size_of::(); let (hw, data_ptr) = if dest.is_some() { let hw = alloc(dest, hdr)?; let dp = if n > 0 { shm::shmalloc(n * ew)? 
} else { std::ptr::null_mut() }; (hw, dp) } else { let w = alloc(None, hdr + n * ew)?; // SAFETY: data is hdr bytes into the same shmalloc block let dp = unsafe { w.as_ptr().add(hdr) }; (w, dp) }; let data_rel = if data_ptr.is_null() { RELNULL } else { shm::abs2rel(data_ptr)? }; for (i, elem) in arr_val.iter().enumerate() { // SAFETY: data_ptr + i * ew is within the data allocation let ep = unsafe { data_ptr.add(i * ew) }; json_to_voidstar(elem, es, Some(ep))?; } hw.write_array_header(0, n, data_rel); Ok(hw.as_ptr()) } SerialType::Tuple | SerialType::Map => { let fields = extract_fields(value, schema)?; if fields.len() != schema.parameters.len() { return Err(err(&format!("expected {} fields, got {}", schema.parameters.len(), fields.len()))); } let w = alloc(dest, schema.width)?; w.zero(0, schema.width); for (i, (fv, fs)) in fields.iter().zip(schema.parameters.iter()).enumerate() { let sub = w.sub(schema.offsets[i], fs.width); json_to_voidstar(fv, fs, Some(sub.as_ptr()))?; } Ok(w.as_ptr()) } SerialType::Optional => { let inner = schema.parameters.first().ok_or_else(|| err("optional has no inner type"))?; let off = shm::align_up(1, inner.alignment().max(1)); let total = off + inner.width; let w = alloc(dest, total)?; if value.is_null() { w.zero(0, total); } else { w.write_val::(0, 1); json_to_voidstar(value, inner, Some(w.sub(off, inner.width).as_ptr()))?; } Ok(w.as_ptr()) } SerialType::Tensor => Err(err("Tensor JSON parsing not yet implemented")), } } fn extract_fields(value: &serde_json::Value, schema: &Schema) -> Result, MorlocError> { if schema.serial_type == SerialType::Map && value.is_object() { let obj = value.as_object().unwrap(); Ok(schema.keys.iter().map(|k| obj.get(k).cloned().unwrap_or(serde_json::Value::Null)).collect()) } else { value.as_array().ok_or_else(|| err("expected array for tuple/map")).cloned() } } // ── Voidstar -> JSON ─────────────────────────────────────────────────────── pub fn voidstar_to_json_string(ptr: AbsPtr, schema: &Schema) -> 
Result { let mut buf = String::new(); // SAFETY: ptr from shmalloc/rel2abs — valid SHM let r = unsafe { ShmReader::new(ptr) }; to_json(&r, schema, &mut buf)?; Ok(buf) } pub fn print_voidstar(ptr: AbsPtr, schema: &Schema) -> Result<(), MorlocError> { println!("{}", voidstar_to_json_string(ptr, schema)?); Ok(()) } pub fn pretty_print_voidstar(ptr: AbsPtr, schema: &Schema) -> Result<(), MorlocError> { let json = voidstar_to_json_string(ptr, schema)?; let v: serde_json::Value = serde_json::from_str(&json).map_err(|e| err(&e.to_string()))?; match &v { // Print strings as raw text (unescaped, no quotes) serde_json::Value::String(s) => println!("{}", s), // Print numbers and bools as plain values serde_json::Value::Number(n) => println!("{}", n), serde_json::Value::Bool(b) => println!("{}", b), serde_json::Value::Null => println!("null"), // Print arrays and objects as indented JSON _ => println!("{}", serde_json::to_string_pretty(&v).map_err(|e| err(&e.to_string()))?), } Ok(()) } fn to_json(r: &ShmReader, schema: &Schema, buf: &mut String) -> Result<(), MorlocError> { match schema.serial_type { SerialType::Nil => buf.push_str("null"), SerialType::Bool => buf.push_str(if r.read_u8(0) != 0 { "true" } else { "false" }), SerialType::Sint8 => buf.push_str(&(r.read_val::(0)).to_string()), SerialType::Sint16 => buf.push_str(&(r.read_val::(0)).to_string()), SerialType::Sint32 => buf.push_str(&(r.read_val::(0)).to_string()), SerialType::Sint64 => buf.push_str(&(r.read_val::(0)).to_string()), SerialType::Uint8 => buf.push_str(&r.read_u8(0).to_string()), SerialType::Uint16 => buf.push_str(&(r.read_val::(0)).to_string()), SerialType::Uint32 => buf.push_str(&(r.read_val::(0)).to_string()), SerialType::Uint64 => buf.push_str(&(r.read_val::(0)).to_string()), SerialType::Float32 => write_float(buf, r.read_val::(0) as f64, b"%.7g\0"), SerialType::Float64 => write_float(buf, r.read_val::(0), b"%.15g\0"), SerialType::String => { let arr = r.read_array(0); if arr.size == 0 || arr.data == 
RELNULL { buf.push_str("\"\""); } else { // SAFETY: arr.data resolved to valid SHM string bytes let dr = unsafe { ShmReader::new(shm::rel2abs(arr.data)?) }; json_escape(dr.read_str(0, arr.size), buf); } } SerialType::Array => { let arr = r.read_array(0); let es = &schema.parameters[0]; buf.push('['); if arr.size > 0 && arr.data != RELNULL { let data = shm::rel2abs(arr.data)?; for i in 0..arr.size { if i > 0 { buf.push(','); } // SAFETY: data + i * es.width within array data block let er = unsafe { ShmReader::new(data.add(i * es.width)) }; to_json(&er, es, buf)?; } } buf.push(']'); } SerialType::Tuple => { buf.push('['); for (i, fs) in schema.parameters.iter().enumerate() { if i > 0 { buf.push(','); } to_json(&r.at(schema.offsets[i]), fs, buf)?; } buf.push(']'); } SerialType::Map => { buf.push('{'); for (i, fs) in schema.parameters.iter().enumerate() { if i > 0 { buf.push(','); } if i < schema.keys.len() { buf.push('"'); buf.push_str(&schema.keys[i]); buf.push_str("\":"); } to_json(&r.at(schema.offsets[i]), fs, buf)?; } buf.push('}'); } SerialType::Optional => { if r.read_u8(0) == 0 { buf.push_str("null"); } else { let inner = &schema.parameters[0]; to_json(&r.at(shm::align_up(1, inner.alignment().max(1))), inner, buf)?; } } SerialType::Tensor => { // SAFETY: reading Tensor struct from SHM let tensor = unsafe { &*(r.ptr as *const shm::Tensor) }; if tensor.total_elements == 0 { buf.push_str("[]"); } else { let ndim = schema.offsets.first().copied().unwrap_or(1); let sp = shm::rel2abs(tensor.shape)?; // SAFETY: sp points to ndim i64 values in SHM let shape: Vec = (0..ndim).map(|i| unsafe { *((sp as *const i64).add(i)) } as usize).collect(); let dp = shm::rel2abs(tensor.data)?; let es = &schema.parameters[0]; tensor_to_json(buf, dp, &shape, tensor.total_elements, es)?; } } } Ok(()) } fn tensor_to_json( buf: &mut String, data: *const u8, shape: &[usize], stride: usize, es: &Schema, ) -> Result<(), MorlocError> { buf.push('['); if shape.len() == 1 { for i in 0..shape[0] 
{ if i > 0 { buf.push(','); } // SAFETY: data + i * es.width within tensor data let r = unsafe { ShmReader::new(data.add(i * es.width)) }; to_json(&r, es, buf)?; } } else { let inner = stride / shape[0]; for i in 0..shape[0] { if i > 0 { buf.push(','); } tensor_to_json(buf, data.wrapping_add(i * inner * es.width), &shape[1..], inner, es)?; } } buf.push(']'); Ok(()) } // ── Helpers ──────────────────────────────────────────────────────────────── fn json_escape(s: &str, buf: &mut String) { buf.push('"'); for ch in s.chars() { match ch { '"' => buf.push_str("\\\""), '\\' => buf.push_str("\\\\"), '/' => buf.push_str("\\/"), '\x08' => buf.push_str("\\b"), '\x0c' => buf.push_str("\\f"), '\n' => buf.push_str("\\n"), '\r' => buf.push_str("\\r"), '\t' => buf.push_str("\\t"), c if c < '\x20' => buf.push_str(&format!("\\u{:04x}", c as u32)), c => buf.push(c), } } buf.push('"'); } fn err(msg: &str) -> MorlocError { MorlocError::Serialization(msg.into()) } fn as_i64(v: &serde_json::Value) -> Result { v.as_i64().ok_or_else(|| err("expected integer")) } fn as_u64(v: &serde_json::Value) -> Result { v.as_u64().ok_or_else(|| err("expected unsigned integer")) } fn as_f64(v: &serde_json::Value) -> Result { v.as_f64().ok_or_else(|| err("expected number")) } fn write_float(buf: &mut String, f: f64, fmt: &[u8]) { if f.is_nan() || f.is_infinite() { buf.push_str("null"); return; } let mut cbuf = [0u8; 64]; // SAFETY: snprintf writes to stack-local buffer with explicit size limit let n = unsafe { libc::snprintf(cbuf.as_mut_ptr() as *mut libc::c_char, cbuf.len(), fmt.as_ptr() as *const libc::c_char, f) }; if n > 0 && (n as usize) < cbuf.len() { buf.push_str(std::str::from_utf8(&cbuf[..n as usize]).unwrap_or("0")); } else { buf.push_str("0"); } } #[cfg(test)] mod tests { use super::*; use crate::schema::parse_schema; fn setup() { crate::init_test_shm(); } #[test] fn test_int() { setup(); let s = parse_schema("i4").unwrap(); let p = read_json_with_schema("42", &s).unwrap(); 
assert_eq!(voidstar_to_json_string(p, &s).unwrap(), "42"); } #[test] fn test_string() { setup(); let s = parse_schema("s").unwrap(); let p = read_json_with_schema("\"hello\"", &s).unwrap(); assert_eq!(voidstar_to_json_string(p, &s).unwrap(), "\"hello\""); } #[test] fn test_bool() { setup(); let s = parse_schema("b").unwrap(); let p = read_json_with_schema("true", &s).unwrap(); assert_eq!(voidstar_to_json_string(p, &s).unwrap(), "true"); } #[test] fn test_array() { setup(); let s = parse_schema("ai4").unwrap(); let p = read_json_with_schema("[1,2,3]", &s).unwrap(); assert_eq!(voidstar_to_json_string(p, &s).unwrap(), "[1,2,3]"); } #[test] fn test_opt_some(){ setup(); let s = parse_schema("?i4").unwrap(); let p = read_json_with_schema("5", &s).unwrap(); assert_eq!(voidstar_to_json_string(p, &s).unwrap(), "5"); } #[test] fn test_opt_null(){ setup(); let s = parse_schema("?i4").unwrap(); let p = read_json_with_schema("null", &s).unwrap(); assert_eq!(voidstar_to_json_string(p, &s).unwrap(), "null"); } } ================================================ FILE: data/rust/morloc-runtime/src/json_ffi.rs ================================================ //! C ABI wrappers for JSON functions. //! Replaces json.c's core functions with calls to Rust json.rs. //! Arrow output and json_buf API are also implemented here. 
use std::ffi::{c_char, c_void, CStr, CString}; use std::ptr; use crate::cschema::CSchema; use crate::error::{clear_errmsg, set_errmsg, MorlocError}; // ── quoted ───────────────────────────────────────────────────────────────── #[no_mangle] pub unsafe extern "C" fn quoted(input: *const c_char) -> *mut c_char { if input.is_null() { return ptr::null_mut(); } let s = CStr::from_ptr(input); let bytes = s.to_bytes(); let len = bytes.len(); // Simple wrapping: "input" (matching C behavior — no escaping) let buf = libc::calloc(len + 3, 1) as *mut c_char; if buf.is_null() { return ptr::null_mut(); } *buf = b'"' as c_char; std::ptr::copy_nonoverlapping(bytes.as_ptr(), buf.add(1) as *mut u8, len); *buf.add(len + 1) = b'"' as c_char; buf } // ── read_json_with_schema ────────────────────────────────────────────────── #[no_mangle] pub unsafe extern "C" fn read_json_with_schema( dest: *mut u8, json_str: *mut c_char, schema: *const CSchema, errmsg: *mut *mut c_char, ) -> *mut u8 { clear_errmsg(errmsg); if json_str.is_null() || schema.is_null() { set_errmsg(errmsg, &MorlocError::NullPointer); return ptr::null_mut(); } let rs = CSchema::to_rust(schema); let json = CStr::from_ptr(json_str).to_string_lossy(); let dest_opt = if dest.is_null() { None } else { Some(dest) }; match crate::json::read_json_with_schema_dest(dest_opt, &json, &rs) { Ok(ptr) => ptr, Err(e) => { set_errmsg(errmsg, &e); ptr::null_mut() } } } // ── voidstar_to_json_string ──────────────────────────────────────────────── #[no_mangle] pub unsafe extern "C" fn voidstar_to_json_string( data: *const c_void, schema: *const CSchema, errmsg: *mut *mut c_char, ) -> *mut c_char { clear_errmsg(errmsg); let rs = CSchema::to_rust(schema); match crate::json::voidstar_to_json_string(data as *mut u8, &rs) { Ok(s) => { match CString::new(s) { Ok(cs) => cs.into_raw(), Err(_) => { set_errmsg(errmsg, &MorlocError::Other("CString conversion failed".into())); ptr::null_mut() } } } Err(e) => { set_errmsg(errmsg, &e); ptr::null_mut() } 
} } // ── print_voidstar ───────────────────────────────────────────────────────── #[no_mangle] pub unsafe extern "C" fn print_voidstar( data: *const c_void, schema: *const CSchema, errmsg: *mut *mut c_char, ) -> bool { clear_errmsg(errmsg); let rs = CSchema::to_rust(schema); match crate::json::print_voidstar(data as *mut u8, &rs) { Ok(_) => true, Err(e) => { set_errmsg(errmsg, &e); false } } } #[no_mangle] pub unsafe extern "C" fn pretty_print_voidstar( data: *const c_void, schema: *const CSchema, errmsg: *mut *mut c_char, ) -> bool { clear_errmsg(errmsg); let rs = CSchema::to_rust(schema); match crate::json::pretty_print_voidstar(data as *mut u8, &rs) { Ok(_) => true, Err(e) => { set_errmsg(errmsg, &e); false } } } // ── json_buf API (used by daemon.c for discovery JSON) ───────────────────── /// Dynamic JSON string builder. pub struct JsonBuf { buf: String, needs_comma: Vec, } #[no_mangle] pub extern "C" fn json_buf_new() -> *mut JsonBuf { Box::into_raw(Box::new(JsonBuf { buf: String::with_capacity(256), needs_comma: Vec::new(), })) } #[no_mangle] pub unsafe extern "C" fn json_buf_free(jb: *mut JsonBuf) { if !jb.is_null() { let _ = Box::from_raw(jb); } } #[no_mangle] pub unsafe extern "C" fn json_buf_finish(jb: *mut JsonBuf) -> *mut c_char { if jb.is_null() { return ptr::null_mut(); } let jb = Box::from_raw(jb); match CString::new(jb.buf) { Ok(cs) => cs.into_raw(), Err(_) => ptr::null_mut(), } } unsafe fn jb_maybe_comma(jb: &mut JsonBuf) { if let Some(needs) = jb.needs_comma.last_mut() { if *needs { jb.buf.push(','); } *needs = true; } } #[no_mangle] pub unsafe extern "C" fn json_write_obj_start(jb: *mut JsonBuf) { if jb.is_null() { return; } let jb = &mut *jb; jb_maybe_comma(jb); jb.buf.push('{'); jb.needs_comma.push(false); } #[no_mangle] pub unsafe extern "C" fn json_write_obj_end(jb: *mut JsonBuf) { if jb.is_null() { return; } let jb = &mut *jb; jb.needs_comma.pop(); jb.buf.push('}'); } #[no_mangle] pub unsafe extern "C" fn json_write_arr_start(jb: *mut 
JsonBuf) { if jb.is_null() { return; } let jb = &mut *jb; jb_maybe_comma(jb); jb.buf.push('['); jb.needs_comma.push(false); } #[no_mangle] pub unsafe extern "C" fn json_write_arr_end(jb: *mut JsonBuf) { if jb.is_null() { return; } let jb = &mut *jb; jb.needs_comma.pop(); jb.buf.push(']'); } #[no_mangle] pub unsafe extern "C" fn json_write_key(jb: *mut JsonBuf, key: *const c_char) { if jb.is_null() || key.is_null() { return; } let jb = &mut *jb; jb_maybe_comma(jb); let s = CStr::from_ptr(key).to_string_lossy(); jb.buf.push('"'); jb.buf.push_str(&s); jb.buf.push_str("\":"); // Don't set needs_comma — the value will follow immediately if let Some(needs) = jb.needs_comma.last_mut() { *needs = false; } } #[no_mangle] pub unsafe extern "C" fn json_write_string(jb: *mut JsonBuf, val: *const c_char) { if jb.is_null() { return; } let jb = &mut *jb; jb_maybe_comma(jb); if val.is_null() { jb.buf.push_str("null"); } else { let s = CStr::from_ptr(val).to_string_lossy(); // JSON-escape the string jb.buf.push('"'); for ch in s.chars() { match ch { '"' => jb.buf.push_str("\\\""), '\\' => jb.buf.push_str("\\\\"), '\n' => jb.buf.push_str("\\n"), '\r' => jb.buf.push_str("\\r"), '\t' => jb.buf.push_str("\\t"), c if c < '\x20' => { jb.buf.push_str(&format!("\\u{:04x}", c as u32)); } c => jb.buf.push(c), } } jb.buf.push('"'); } } #[no_mangle] pub unsafe extern "C" fn json_write_int(jb: *mut JsonBuf, val: i64) { if jb.is_null() { return; } let jb = &mut *jb; jb_maybe_comma(jb); jb.buf.push_str(&val.to_string()); } #[no_mangle] pub unsafe extern "C" fn json_write_uint(jb: *mut JsonBuf, val: u64) { if jb.is_null() { return; } let jb = &mut *jb; jb_maybe_comma(jb); jb.buf.push_str(&val.to_string()); } #[no_mangle] pub unsafe extern "C" fn json_write_bool(jb: *mut JsonBuf, val: bool) { if jb.is_null() { return; } let jb = &mut *jb; jb_maybe_comma(jb); jb.buf.push_str(if val { "true" } else { "false" }); } #[no_mangle] pub unsafe extern "C" fn json_write_null(jb: *mut JsonBuf) { if 
jb.is_null() { return; } let jb = &mut *jb; jb_maybe_comma(jb); jb.buf.push_str("null"); } #[no_mangle] pub unsafe extern "C" fn json_write_raw(jb: *mut JsonBuf, raw: *const c_char) { if jb.is_null() || raw.is_null() { return; } let jb = &mut *jb; jb_maybe_comma(jb); let s = CStr::from_ptr(raw).to_string_lossy(); jb.buf.push_str(&s); } // ── Arrow JSON output ────────────────────────────────────────────────────── // Arrow output is complex and depends on the Arrow C Data Interface. // These are implemented in C (arrow_json.c) and linked via the hybrid build. // The functions below are stubs that will be overridden by the C implementations // when we create a separate arrow_json.c file. // For now, remove the Rust stubs and let C json.c's implementations be used // from a separate compilation unit. // print_arrow_as_json and print_arrow_as_table are provided by the C // arrow_json code (extracted from json.c, kept in build as arrow_json.c) #[allow(dead_code)] unsafe fn _print_arrow_as_json_stub( data: *const c_void, errmsg: *mut *mut c_char, ) -> bool { clear_errmsg(errmsg); // Use the arrow.c implementation which handles the Arrow C Data Interface extern "C" { fn arrow_column_desc( header: *const c_void, col_idx: usize, ) -> *const c_void; fn arrow_column_data( header: *const c_void, col_idx: usize, ) -> *const c_void; fn arrow_column_name( header: *const c_void, col_idx: usize, ) -> *const c_char; } // Read arrow_shm_header fields // arrow_shm_header_t: { magic: u32, n_columns: u32, n_rows: u64, ... } let header = data as *const u8; let n_columns = *(header.add(4) as *const u32) as usize; let n_rows = *(header.add(8) as *const u64) as usize; // Build JSON array of objects print!("["); for row in 0..n_rows { if row > 0 { print!(","); } print!("{{"); for col in 0..n_columns { if col > 0 { print!(","); } let name = arrow_column_name(data, col); let name_str = if name.is_null() { "?" 
} else { CStr::from_ptr(name).to_str().unwrap_or("?") }; print!("\"{}\":", name_str); let desc = arrow_column_desc(data, col); if desc.is_null() { print!("null"); continue; } // desc is arrow_column_desc_t: { type: u8, length: u32, null_count: u32, name_offset, data_offset } let col_type = *(desc as *const u8); let col_data = arrow_column_data(data, col); // Print value based on type // Types: 0=nil, 1=bool, 2=i8, ..., 11=f64, 13=string match col_type { 4 => { // i32 let vals = col_data as *const i32; print!("{}", *vals.add(row)); } 5 => { // i64 let vals = col_data as *const i64; print!("{}", *vals.add(row)); } 11 => { // f64 let vals = col_data as *const f64; let mut cbuf = [0u8; 64]; let fmt = b"%.15g\0"; let n = libc::snprintf(cbuf.as_mut_ptr() as *mut c_char, 64, fmt.as_ptr() as *const c_char, *vals.add(row)); if n > 0 { let s = std::str::from_utf8(&cbuf[..n as usize]).unwrap_or("0"); print!("{}", s); } } 13 => { // string // Arrow strings: offsets array + data buffer // For simplicity, use arrow_column_data which gives the data pointer // This is a simplified implementation — full Arrow string handling // requires offset arrays print!("\"\""); } _ => { print!("null"); } } } print!("}}"); } println!("]"); true } #[allow(dead_code)] unsafe fn _print_arrow_as_table_stub( _data: *const c_void, errmsg: *mut *mut c_char, ) -> bool { clear_errmsg(errmsg); // Stub — Arrow table output is rarely used // The full implementation would print TSV-formatted columns set_errmsg(errmsg, &MorlocError::Other("Arrow table output not yet implemented in Rust".into())); false } ================================================ FILE: data/rust/morloc-runtime/src/lib.rs ================================================ pub mod error; pub mod schema; pub mod packet; pub mod shm; pub mod hash; pub mod ipc; pub mod json; pub mod mpack; // FFI and utility modules export #[no_mangle] extern "C" symbols. 
// When the "no-ffi-exports" feature is active (nexus build), these modules // are not compiled, preventing symbol conflicts with libmorloc.so. // CSchema type is always available (used by nexus for Rust<->C conversion) pub mod cschema; pub mod ffi; pub mod utility; pub mod cache; pub mod intrinsics; pub mod voidstar; pub mod json_ffi; pub mod packet_ffi; pub mod ipc_ffi; pub mod http_ffi; pub mod slurm_ffi; pub mod manifest_ffi; pub mod eval_ffi; pub mod arrow_ffi; pub mod pool_ffi; pub mod daemon_ffi; pub mod router_ffi; pub mod cli; /// Shared test SHM initialization. Call from all test modules. #[cfg(test)] pub(crate) fn init_test_shm() { use std::sync::Once; static INIT: Once = Once::new(); INIT.call_once(|| { let tmpdir = std::env::temp_dir(); let test_dir = tmpdir.join(format!("morloc_test_{}", std::process::id())); let _ = std::fs::create_dir_all(&test_dir); shm::shm_set_fallback_dir(test_dir.to_str().unwrap()); let basename = format!("morloc_test_{}", std::process::id()); shm::shinit(&basename, 0, 0x100000).unwrap(); // 1MB }); } // Re-export core types at crate root pub use error::MorlocError; pub use schema::{Schema, SerialType}; pub use packet::{PacketHeader, PACKET_MAGIC}; pub use shm::{RelPtr, VolPtr, AbsPtr, Array, Tensor}; ================================================ FILE: data/rust/morloc-runtime/src/manifest_ffi.rs ================================================ //! C ABI wrappers for manifest parsing and discovery JSON. //! //! This file mirrors the manifest data model into raw `#[repr(C)]` //! structs that the daemon and slurm subsystems read via FFI from C //! code. It is **not** the canonical Rust deserializer of the manifest //! schema -- that lives in //! `data/rust/morloc-nexus/src/manifest.rs`, which has full doc //! comments describing the v2 manifest schema, every field's purpose, //! and which slots are reserved for future expansion. //! //! The split exists for two reasons: //! //! 1. 
**C ABI stability.** The C structs here have the original v1 //! field layout (flat `arg_schemas`, `return_schema`, `return_type`, //! `return_desc`, `build_dir`, `version`) so that downstream C //! callers (the daemon, the slurm bridge, any third-party FFI //! consumers) don't break when the JSON schema evolves. The //! `parse_manifest` function below reads the new v2 JSON shape and //! populates these legacy C struct fields, acting as a translation //! layer. //! //! 2. **Build-time decoupling.** The morloc-runtime crate needs to //! consume manifests without depending on the morloc-nexus crate. //! Sharing a Rust-level data model would create a circular //! dependency between the two crates. //! //! When the v2 schema gains new fields (constraints, metadata, etc.), //! the canonical Rust model in `morloc-nexus/src/manifest.rs` is //! updated first. This file gets new C struct fields only when a C-side //! consumer needs them; otherwise the new JSON keys are silently //! ignored here, which is the correct forward-compatible behavior. 
use std::ffi::{c_char, c_void, CStr, CString}; use std::ptr; use crate::cschema::CSchema; use crate::error::{clear_errmsg, set_errmsg, MorlocError}; // -- C-compatible types matching eval.h --------------------------------------- #[repr(C)] #[derive(Debug, Clone, Copy, PartialEq)] pub enum MorlocExpressionType { Dat = 0, App = 1, Lam = 2, Bnd = 3, Pat = 4, Fmt = 5, Show = 6, Read = 7, Hash = 8, Save = 9, Load = 10, } #[repr(C)] #[derive(Debug, Clone, Copy, PartialEq)] pub enum MorlocAppExpressionType { Pattern = 0, Lambda = 1, Format = 2, } #[repr(C)] #[derive(Debug, Clone, Copy, PartialEq)] pub enum MorlocPatternType { ByKey = 0, ByIndex = 1, End = 2, } #[repr(C)] pub union PatternFields { pub indices: *mut usize, pub keys: *mut *mut c_char, } #[repr(C)] pub struct MorlocPattern { pub ptype: MorlocPatternType, pub size: usize, pub fields: PatternFields, pub selectors: *mut *mut MorlocPattern, } #[repr(C)] pub union Primitive { pub s: *mut c_char, pub z: u8, pub b: bool, pub i1: i8, pub i2: i16, pub i4: i32, pub i8_: i64, pub u1: u8, pub u2: u16, pub u4: u32, pub u8_: u64, pub f4: f32, pub f8: f64, } #[repr(C)] pub struct MorlocDataArray { pub schema: *mut CSchema, pub size: usize, pub values: *mut *mut MorlocExpression, } #[repr(C)] // Primitive contains a pointer (s: *mut c_char), so DataUnion uses ManuallyDrop #[repr(C)] pub union DataUnion { pub lit_val: std::mem::ManuallyDrop, pub tuple_val: *mut *mut MorlocExpression, pub array_val: *mut MorlocDataArray, pub voidstar: *mut c_void, } #[repr(C)] pub struct MorlocData { pub is_voidstar: bool, pub data: DataUnion, } #[repr(C)] pub union AppFunction { pub pattern: *mut MorlocPattern, pub lambda: *mut MorlocLamExpression, pub fmt: *mut *mut c_char, } #[repr(C)] pub struct MorlocAppExpression { pub atype: MorlocAppExpressionType, pub function: AppFunction, pub args: *mut *mut MorlocExpression, pub nargs: usize, } #[repr(C)] pub struct MorlocLamExpression { pub nargs: usize, pub args: *mut *mut c_char, pub body: *mut 
MorlocExpression, } #[repr(C)] pub struct MorlocSaveExpression { pub format: *mut c_char, pub value: *mut MorlocExpression, pub path: *mut MorlocExpression, } #[repr(C)] pub union ExprUnion { pub app_expr: *mut MorlocAppExpression, pub lam_expr: *mut MorlocLamExpression, pub bnd_expr: *mut c_char, pub interpolation: *mut *mut c_char, pub pattern_expr: *mut MorlocPattern, pub data_expr: *mut MorlocData, pub unary_expr: *mut MorlocExpression, pub save_expr: *mut MorlocSaveExpression, } #[repr(C)] pub struct MorlocExpression { pub etype: MorlocExpressionType, pub schema: *mut CSchema, pub expr: ExprUnion, } // -- C-ABI mirror of morloc-manifest v2 --------------------------------------- // // These #[repr(C)] structs are the in-memory layout that daemon_ffi / // router_ffi / slurm_ffi consume via raw pointers. They mirror the // shape of morloc_manifest's Rust types one-for-one (modulo C-string // encoding) -- when the Rust schema gains a new field, it's added here // too as a parallel C field. There is no longer any "translation" or // reshape layer; parse_manifest below is a near-1:1 walker. // // Conventions: // - C-string fields are owned by the manifest and freed by free_manifest. // - Array fields use a (pointer, count) pair (e.g. desc + n_desc). // - The "constraints" and "metadata" extension slots described in // morloc-manifest's docs are mirrored here so daemon-side constraint // enforcement can later read them without another C ABI break. // - metadata is serialized as JSON text (`metadata_json`) because the // C side has no natural map type and the slot is reserved for now. #[repr(C)] pub struct ManifestBuild { pub path: *mut c_char, pub time: i64, pub morloc_version: *mut c_char, } #[repr(C)] pub struct ManifestConstraint { /// Constraint discriminator (e.g. "kind", "min", "regex"). pub ctype: *mut c_char, /// JSON-encoded payload for the constraint, or NULL when the /// constraint type carries no value (e.g. "non_empty"). 
pub value_json: *mut c_char, } #[repr(C)] pub struct ManifestPool { pub lang: *mut c_char, pub exec: *mut *mut c_char, // NULL-terminated pub socket: *mut c_char, /// JSON-encoded pool-level metadata. Reserved. pub metadata_json: *mut c_char, } #[repr(C)] #[derive(Debug, Clone, Copy, PartialEq)] pub enum ManifestArgKind { Pos = 0, Opt = 1, Flag = 2, Grp = 3, } #[repr(C)] pub struct ManifestGrpEntry { pub key: *mut c_char, pub arg: *mut ManifestArg, } #[repr(C)] pub struct ManifestArg { pub kind: ManifestArgKind, /// Per-arg morloc serialization schema. NULL for flags. Group /// entries also have NULL here (the group's top-level schema /// covers them). pub schema: *mut c_char, /// User-facing type name. NULL for flags. pub type_desc: *mut c_char, pub metavar: *mut c_char, pub quoted: bool, pub short_opt: c_char, pub long_opt: *mut c_char, pub long_rev: *mut c_char, pub default_val: *mut c_char, /// NULL-terminated array of description lines. pub desc: *mut *mut c_char, pub n_desc: usize, /// Array of ManifestConstraint owned by this arg. pub constraints: *mut ManifestConstraint, pub n_constraints: usize, /// Group sub-fields (only meaningful when kind == Grp). pub grp_short: c_char, pub grp_long: *mut c_char, pub entries: *mut ManifestGrpEntry, pub n_entries: usize, /// JSON-encoded per-arg metadata. Reserved. 
// NOTE(review): this chunk opens mid-struct -- the field below closes a
// struct whose header is above this view. Throughout this file several
// generic argument lists appear stripped by extraction (e.g.
// `size_of::()`, `parse::()`); left byte-identical and flagged -- TODO
// restore the type parameters from version control.
pub metadata_json: *mut c_char, }

/// C-ABI descriptor for a command's return value (v2 layout).
/// All `*mut c_char` fields are owned libc allocations (see free_return).
#[repr(C)]
pub struct ManifestReturn {
    pub schema: *mut c_char,
    pub type_desc: *mut c_char,
    pub desc: *mut *mut c_char,
    pub n_desc: usize,
    pub constraints: *mut ManifestConstraint,
    pub n_constraints: usize,
    pub metadata_json: *mut c_char,
}

/// C-ABI descriptor for a named command group (help-text grouping).
#[repr(C)]
pub struct ManifestCmdGroup {
    pub name: *mut c_char,
    pub desc: *mut *mut c_char,
    pub n_desc: usize,
    pub metadata_json: *mut c_char,
}

/// C-ABI descriptor for one manifest command: identity, pool routing,
/// CLI args, return descriptor, constraints, and (for pure commands)
/// a pre-built expression tree.
#[repr(C)]
pub struct ManifestCommand {
    pub name: *mut c_char,
    pub is_pure: bool,
    pub mid: u32,
    pub pool_index: usize,
    pub needed_pools: *mut usize,
    pub n_needed_pools: usize,
    pub desc: *mut *mut c_char,
    pub n_desc: usize,
    pub args: *mut ManifestArg,
    pub n_args: usize,
    /// Return-value descriptor as a sub-struct (replaces v1's flat
    /// return_schema/return_type/return_desc fields).
    pub ret: ManifestReturn,
    pub constraints: *mut ManifestConstraint,
    pub n_constraints: usize,
    pub expr: *mut MorlocExpression,
    pub group: *mut c_char,
    pub metadata_json: *mut c_char,
}

/// C-ABI descriptor for an optional service section (daemon endpoint).
#[repr(C)]
pub struct ManifestService {
    pub stype: *mut c_char,
    pub host: *mut c_char,
    pub port: i32,
    pub socket: *mut c_char,
    pub metadata_json: *mut c_char,
}

/// Top-level C-ABI manifest: build info, pools, commands, groups, and
/// an optional service block. Freed as a unit by free_manifest.
#[repr(C)]
pub struct Manifest {
    pub name: *mut c_char,
    pub build: ManifestBuild,
    pub pools: *mut ManifestPool,
    pub n_pools: usize,
    pub commands: *mut ManifestCommand,
    pub n_commands: usize,
    pub groups: *mut ManifestCmdGroup,
    pub n_groups: usize,
    pub service: *mut ManifestService,
    pub metadata_json: *mut c_char,
}

impl ManifestCommand {
    /// Build a transient NULL-terminated array of schema strings for
    /// the command's args, in declaration order. The caller owns the
    /// outer array allocation but NOT the inner C strings (they
    /// remain owned by the ManifestArg objects). Use
    /// `libc::free(arr as *mut c_void)` to release the outer array
    /// when done.
    ///
    /// The array has one entry per arg INCLUDING flags. Flags have a
    /// per-arg `schema` field of NULL on the v2 ManifestArg, but the
    /// legacy callers (e.g. make_call_packet_from_cli) expect a slot
    /// per arg position to keep index alignment with the parallel
    /// args array; we substitute "b" (the boolean schema) for flags
    /// so dispatch reads the flag value as a Bool, matching v1
    /// behavior.
    pub unsafe fn build_arg_schemas_array(&self) -> *mut *mut c_char {
        let n = self.n_args;
        // calloc(n + 1, ...) leaves the final slot zeroed; we also set
        // it to NULL explicitly below for clarity.
        let arr = libc::calloc(n + 1, std::mem::size_of::<*mut c_char>()) as *mut *mut c_char;
        for i in 0..n {
            let arg = &*self.args.add(i);
            *arr.add(i) = if arg.kind == ManifestArgKind::Flag || arg.schema.is_null() {
                // Flag schema fallback: point at a static "b" literal.
                // This pointer is NOT freed by the caller (it's a global
                // string literal); since the caller only frees the OUTER
                // array and the per-arg owners free their own schemas,
                // this is safe.
                static FLAG_SCHEMA: &[u8] = b"b\0";
                FLAG_SCHEMA.as_ptr() as *mut c_char
            } else {
                arg.schema
            };
        }
        *arr.add(n) = ptr::null_mut();
        arr
    }
}

// -- Helpers ------------------------------------------------------------------

/// Duplicate a Rust &str into a libc-owned C string.
/// Returns NULL if the input contains an interior NUL byte.
unsafe fn c_strdup(s: &str) -> *mut c_char {
    match CString::new(s) {
        Ok(cs) => libc::strdup(cs.as_ptr()),
        Err(_) => ptr::null_mut(),
    }
}

/// Like c_strdup but maps None to a NULL pointer.
unsafe fn nullable_strdup(s: Option<&str>) -> *mut c_char {
    match s {
        Some(s) => c_strdup(s),
        None => ptr::null_mut(),
    }
}

// -- Expression builder (using serde_json::Value) -----------------------------

/// Recursively build a C MorlocPattern from its JSON encoding.
/// Recognized "type" values: "end" (leaf), "idx" (select by index),
/// "key" (select by record key). Each selector carries a "sub" pattern.
unsafe fn build_pattern(jp: &serde_json::Value) -> Result<*mut MorlocPattern, MorlocError> {
    let ptype = jp.get("type").and_then(|v| v.as_str()).ok_or_else(|| MorlocError::Other("Pattern missing 'type' field".into()))?;
    if ptype == "end" {
        // make_morloc_pattern_end - call C function
        extern "C" {
            fn make_morloc_pattern_end() -> *mut MorlocPattern;
        }
        return Ok(make_morloc_pattern_end());
    }
    let sels = jp.get("selectors").and_then(|v| v.as_array());
    let n = sels.map(|a| a.len()).unwrap_or(0);
    // NOTE(review): stripped generic here -- presumably size_of::<MorlocPattern>().
    let pat = libc::calloc(1, std::mem::size_of::()) as *mut MorlocPattern;
    (*pat).size = n;
    (*pat).selectors = libc::calloc(n, std::mem::size_of::<*mut MorlocPattern>()) as *mut *mut MorlocPattern;
    if ptype == "idx" {
        (*pat).ptype = MorlocPatternType::ByIndex;
        // NOTE(review): stripped generic -- presumably size_of::<usize>().
        (*pat).fields.indices = libc::calloc(n, std::mem::size_of::()) as *mut usize;
        if let Some(sels) = sels {
            for (i, sel) in sels.iter().enumerate() {
                // JSON numbers arrive as f64; truncate to usize.
                *(*pat).fields.indices.add(i) = sel.get("index").and_then(|v| v.as_f64()).unwrap_or(0.0) as usize;
                *(*pat).selectors.add(i) = build_pattern(sel.get("sub").unwrap_or(&serde_json::Value::Null))?;
            }
        }
    } else if ptype == "key" {
        (*pat).ptype = MorlocPatternType::ByKey;
        (*pat).fields.keys = libc::calloc(n, std::mem::size_of::<*mut c_char>()) as *mut *mut c_char;
        if let Some(sels) = sels {
            for (i, sel) in sels.iter().enumerate() {
                let key = sel.get("key").and_then(|v| v.as_str()).unwrap_or("");
                *(*pat).fields.keys.add(i) = c_strdup(key);
                *(*pat).selectors.add(i) = build_pattern(sel.get("sub").unwrap_or(&serde_json::Value::Null))?;
            }
        }
    } else {
        return Err(MorlocError::Other(format!("Unknown pattern type: {}", ptype)));
    }
    Ok(pat)
}

/// Recursively build a C MorlocExpression tree from its tagged JSON
/// encoding. Dispatches on the "tag" field; each arm allocates the
/// corresponding C node via libc or a C constructor. Errors reported
/// through the C constructors' errmsg out-params are converted to
/// MorlocError::Other.
///
/// NOTE(review): several `parse::()` / `size_of::()` calls below have
/// stripped generic parameters (extraction damage) -- left as-is.
unsafe fn build_expr(je: &serde_json::Value) -> Result<*mut MorlocExpression, MorlocError> {
    let tag = je.get("tag").and_then(|v| v.as_str()).ok_or_else(|| MorlocError::Other("Expression missing 'tag' field".into()))?;
    extern "C" {
        fn parse_schema(s: *const c_char, errmsg: *mut *mut c_char) -> *mut CSchema;
        fn make_morloc_literal(schema: *const c_char, prim: Primitive, errmsg: *mut *mut c_char) -> *mut MorlocExpression;
        fn make_morloc_bound_var(schema: *const c_char, var: *mut c_char, errmsg: *mut *mut c_char) -> *mut MorlocExpression;
        fn make_morloc_pattern(schema: *const c_char, pat: *mut MorlocPattern, errmsg: *mut *mut c_char) -> *mut MorlocExpression;
    }
    let mut err: *mut c_char = ptr::null_mut();
    match tag {
        "lit" => {
            // Numeric/bool/unit literal; "lit_type" selects the Primitive
            // union field, "value" holds the textual value.
            let schema = je.get("schema").and_then(|v| v.as_str()).unwrap_or("");
            let lt = je.get("lit_type").and_then(|v| v.as_str()).unwrap_or("");
            let val = je.get("value").and_then(|v| v.as_str()).unwrap_or("0");
            let mut prim: Primitive = std::mem::zeroed();
            match lt {
                "f4" => prim.f4 = val.parse::().unwrap_or(0.0),
                "f8" => prim.f8 = val.parse::().unwrap_or(0.0),
                "i1" => prim.i1 = val.parse::().unwrap_or(0),
                "i2" => prim.i2 = val.parse::().unwrap_or(0),
                "i4" => prim.i4 = val.parse::().unwrap_or(0),
                "i8" => prim.i8_ = val.parse::().unwrap_or(0),
                "u1" => prim.u1 = val.parse::().unwrap_or(0),
                "u2" => prim.u2 = val.parse::().unwrap_or(0),
                "u4" => prim.u4 = val.parse::().unwrap_or(0),
                "u8" => prim.u8_ = val.parse::().unwrap_or(0),
                "b" => prim.b = val != "0",
                "z" => prim.z = 0,
                _ => return Err(MorlocError::Other(format!("Unknown lit_type: {}", lt))),
            }
            let c_schema = CString::new(schema).unwrap_or_default();
            let result = make_morloc_literal(c_schema.as_ptr(), prim, &mut err);
            if !err.is_null() {
                let msg = CStr::from_ptr(err).to_string_lossy().into_owned();
                libc::free(err as *mut c_void);
                return Err(MorlocError::Other(msg));
            }
            Ok(result)
        }
        "str" => {
            // String literal: the Primitive union carries an owned C copy.
            let schema = je.get("schema").and_then(|v| v.as_str()).unwrap_or("");
            let val = je.get("value").and_then(|v| v.as_str()).unwrap_or("");
            let mut prim: Primitive = std::mem::zeroed();
            prim.s = c_strdup(val);
            let c_schema = CString::new(schema).unwrap_or_default();
            let result = make_morloc_literal(c_schema.as_ptr(), prim, &mut err);
            if !err.is_null() {
                let msg = CStr::from_ptr(err).to_string_lossy().into_owned();
                libc::free(err as *mut c_void);
                return Err(MorlocError::Other(msg));
            }
            Ok(result)
        }
        "container" => {
            // Array/tuple/map literal: recursively build elements, then
            // wrap them in a MorlocData node shaped by the parsed schema.
            let schema_str = je.get("schema").and_then(|v| v.as_str()).unwrap_or("");
            let elems = je.get("elements").and_then(|v| v.as_array());
            let n = elems.map(|a| a.len()).unwrap_or(0);
            let c_schema_str = CString::new(schema_str).unwrap_or_default();
            let schema = parse_schema(c_schema_str.as_ptr(), &mut err);
            if !err.is_null() {
                let msg = CStr::from_ptr(err).to_string_lossy().into_owned();
                libc::free(err as *mut c_void);
                return Err(MorlocError::Other(msg));
            }
            let values = libc::calloc(n, std::mem::size_of::<*mut MorlocExpression>()) as *mut *mut MorlocExpression;
            if let Some(elems) = elems {
                for (i, elem) in elems.iter().enumerate() {
                    *values.add(i) = build_expr(elem)?;
                }
            }
            let data = libc::calloc(1, std::mem::size_of::()) as *mut MorlocData;
            (*data).is_voidstar = false;
            let schema_type = (*schema).serial_type;
            // MORLOC_ARRAY = 14, MORLOC_TUPLE = 15, MORLOC_MAP = 16
            if schema_type == 14 {
                // Array
                let arr = libc::calloc(1, std::mem::size_of::()) as *mut MorlocDataArray;
                // Element schema is the array schema's first parameter.
                (*arr).schema = if (*schema).size > 0 && !(*schema).parameters.is_null() { *(*schema).parameters } else { ptr::null_mut() };
                (*arr).size = n;
                (*arr).values = values;
                (*data).data.array_val = arr;
            } else if schema_type == 15 || schema_type == 16 {
                // Tuple or Map
                (*data).data.tuple_val = values;
            } else {
                libc::free(values as *mut c_void);
                libc::free(data as *mut c_void);
                CSchema::free(schema);
                return Err(MorlocError::Other("Container schema is not a container type".into()));
            }
            let expr = libc::calloc(1, std::mem::size_of::()) as *mut MorlocExpression;
            (*expr).etype = MorlocExpressionType::Dat;
            (*expr).schema = schema;
            (*expr).expr.data_expr = data;
            Ok(expr)
        }
        "app" => {
            // Application: the "func" must evaluate to a pattern, lambda,
            // or interpolation node; anything else is rejected.
            let schema_str = je.get("schema").and_then(|v| v.as_str()).unwrap_or("");
            let jargs = je.get("args").and_then(|v| v.as_array());
            let n = jargs.map(|a| a.len()).unwrap_or(0);
            let c_schema_str = CString::new(schema_str).unwrap_or_default();
            let schema = parse_schema(c_schema_str.as_ptr(), &mut err);
            if !err.is_null() {
                let msg = CStr::from_ptr(err).to_string_lossy().into_owned();
                libc::free(err as *mut c_void);
                return Err(MorlocError::Other(msg));
            }
            let func = build_expr(je.get("func").unwrap_or(&serde_json::Value::Null))?;
            let args = libc::calloc(n, std::mem::size_of::<*mut MorlocExpression>()) as *mut *mut MorlocExpression;
            if let Some(jargs) = jargs {
                for (i, a) in jargs.iter().enumerate() {
                    *args.add(i) = build_expr(a)?;
                }
            }
            let app = libc::calloc(1, std::mem::size_of::()) as *mut MorlocAppExpression;
            match (*func).etype {
                MorlocExpressionType::Pat => {
                    (*app).atype = MorlocAppExpressionType::Pattern;
                    (*app).function.pattern = (*func).expr.pattern_expr;
                }
                MorlocExpressionType::Lam => {
                    (*app).atype = MorlocAppExpressionType::Lambda;
                    (*app).function.lambda = (*func).expr.lam_expr;
                }
                MorlocExpressionType::Fmt => {
                    (*app).atype = MorlocAppExpressionType::Format;
                    (*app).function.fmt = (*func).expr.interpolation;
                }
                _ => {
                    return Err(MorlocError::Other(format!("Invalid function in app expression (type={:?})", (*func).etype)));
                }
            }
            (*app).args = args;
            (*app).nargs = n;
            let expr = libc::calloc(1, std::mem::size_of::()) as *mut MorlocExpression;
            (*expr).etype = MorlocExpressionType::App;
            (*expr).schema = schema;
            (*expr).expr.app_expr = app;
            Ok(expr)
        }
        "lambda" => {
            // Lambda: bound variable names plus a body expression.
            // Lambdas carry no schema of their own (schema = NULL).
            let jvars = je.get("vars").and_then(|v| v.as_array());
            let n = jvars.map(|a| a.len()).unwrap_or(0);
            let body = build_expr(je.get("body").unwrap_or(&serde_json::Value::Null))?;
            let vars = libc::calloc(n, std::mem::size_of::<*mut c_char>()) as *mut *mut c_char;
            if let Some(jvars) = jvars {
                for (i, v) in jvars.iter().enumerate() {
                    *vars.add(i) = c_strdup(v.as_str().unwrap_or(""));
                }
            }
            let lam = libc::calloc(1, std::mem::size_of::()) as *mut MorlocLamExpression;
            (*lam).nargs = n;
            (*lam).args = vars;
            (*lam).body = body;
            let expr = libc::calloc(1, std::mem::size_of::()) as *mut MorlocExpression;
            (*expr).etype = MorlocExpressionType::Lam;
            (*expr).schema = ptr::null_mut();
            (*expr).expr.lam_expr = lam;
            Ok(expr)
        }
        "bound" => {
            // Reference to a lambda-bound variable by name.
            let schema = je.get("schema").and_then(|v| v.as_str()).unwrap_or("");
            let var = je.get("var").and_then(|v| v.as_str()).unwrap_or("");
            let c_schema = CString::new(schema).unwrap_or_default();
            let c_var = c_strdup(var);
            let result = make_morloc_bound_var(c_schema.as_ptr(), c_var, &mut err);
            if !err.is_null() {
                let msg = CStr::from_ptr(err).to_string_lossy().into_owned();
                libc::free(err as *mut c_void);
                return Err(MorlocError::Other(msg));
            }
            Ok(result)
        }
        "show" | "read" | "hash" | "load" => {
            // Unary builtins: all share the same shape (schema + child).
            let schema_str = je.get("schema").and_then(|v| v.as_str()).unwrap_or("");
            let c_schema_str = CString::new(schema_str).unwrap_or_default();
            let schema = parse_schema(c_schema_str.as_ptr(), &mut err);
            if !err.is_null() {
                let msg = CStr::from_ptr(err).to_string_lossy().into_owned();
                libc::free(err as *mut c_void);
                return Err(MorlocError::Other(msg));
            }
            let child = build_expr(je.get("child").unwrap_or(&serde_json::Value::Null))?;
            let expr = libc::calloc(1, std::mem::size_of::()) as *mut MorlocExpression;
            (*expr).etype = match tag {
                "show" => MorlocExpressionType::Show,
                "read" => MorlocExpressionType::Read,
                "hash" => MorlocExpressionType::Hash,
                "load" => MorlocExpressionType::Load,
                _ => unreachable!(),
            };
            (*expr).schema = schema;
            (*expr).expr.unary_expr = child;
            Ok(expr)
        }
        "save" => {
            // Save builtin: value + path sub-expressions plus an output
            // format string (defaults to "voidstar").
            let schema_str = je.get("schema").and_then(|v| v.as_str()).unwrap_or("");
            let c_schema_str = CString::new(schema_str).unwrap_or_default();
            let schema = parse_schema(c_schema_str.as_ptr(), &mut err);
            if !err.is_null() {
                let msg = CStr::from_ptr(err).to_string_lossy().into_owned();
                libc::free(err as *mut c_void);
                return Err(MorlocError::Other(msg));
            }
            let fmt_str = je.get("format").and_then(|v| v.as_str()).unwrap_or("voidstar");
            let c_fmt = CString::new(fmt_str).unwrap_or_default();
            let value = build_expr(je.get("value").unwrap_or(&serde_json::Value::Null))?;
            let path = build_expr(je.get("path").unwrap_or(&serde_json::Value::Null))?;
            let save = libc::calloc(1, std::mem::size_of::()) as *mut MorlocSaveExpression;
            // Ownership of the format string transfers to the C struct.
            (*save).format = c_fmt.into_raw();
            (*save).value = value;
            (*save).path = path;
            let expr = libc::calloc(1, std::mem::size_of::()) as *mut MorlocExpression;
            (*expr).etype = MorlocExpressionType::Save;
            (*expr).schema = schema;
            (*expr).expr.save_expr = save;
            Ok(expr)
        }
        "interpolation" => {
            // String interpolation template: NULL-terminated array of
            // literal segments.
            let schema_str = je.get("schema").and_then(|v| v.as_str()).unwrap_or("");
            let jstrs = je.get("strings").and_then(|v| v.as_array());
            let n = jstrs.map(|a| a.len()).unwrap_or(0);
            let c_schema_str = CString::new(schema_str).unwrap_or_default();
            let schema = parse_schema(c_schema_str.as_ptr(), &mut err);
            if !err.is_null() {
                let msg = CStr::from_ptr(err).to_string_lossy().into_owned();
                libc::free(err as *mut c_void);
                return Err(MorlocError::Other(msg));
            }
            let strings = libc::calloc(n + 1, std::mem::size_of::<*mut c_char>()) as *mut *mut c_char;
            if let Some(jstrs) = jstrs {
                for (i, s) in jstrs.iter().enumerate() {
                    *strings.add(i) = c_strdup(s.as_str().unwrap_or(""));
                }
            }
            let expr = libc::calloc(1, std::mem::size_of::()) as *mut MorlocExpression;
            (*expr).etype = MorlocExpressionType::Fmt;
            (*expr).schema = schema;
            (*expr).expr.interpolation = strings;
            Ok(expr)
        }
        "pattern" => {
            // Accessor pattern: delegate structure building to
            // build_pattern, then wrap via the C constructor.
            let schema_str = je.get("schema").and_then(|v| v.as_str()).unwrap_or("");
            let pat = build_pattern(je.get("pattern").unwrap_or(&serde_json::Value::Null))?;
            let c_schema = CString::new(schema_str).unwrap_or_default();
            let result = make_morloc_pattern(c_schema.as_ptr(), pat, &mut err);
            if !err.is_null() {
                let msg = CStr::from_ptr(err).to_string_lossy().into_owned();
                libc::free(err as *mut c_void);
                return Err(MorlocError::Other(msg));
            }
            Ok(result)
        }
        _ => Err(MorlocError::Other(format!("Unknown expression tag: {}", tag))),
    }
}

// -- build_manifest_expr ------------------------------------------------------

/// C entry point: parse an expression JSON string and build the
/// corresponding MorlocExpression tree. On failure, writes a message
/// into `errmsg` and returns NULL.
#[no_mangle]
pub unsafe extern "C" fn build_manifest_expr(
    json_str: *const c_char,
    errmsg: *mut *mut c_char,
) -> *mut MorlocExpression {
    clear_errmsg(errmsg);
    let s = CStr::from_ptr(json_str).to_string_lossy();
    let jv: serde_json::Value = match serde_json::from_str(&s) {
        Ok(v) => v,
        Err(e) => {
            set_errmsg(errmsg, &MorlocError::Other(format!("Failed to parse expression JSON: {}", e)));
            return ptr::null_mut();
        }
    };
    match build_expr(&jv) {
        Ok(expr) => expr,
        Err(e) => {
            set_errmsg(errmsg, &e);
            ptr::null_mut()
        }
    }
}

// -- C-ABI population from morloc-manifest Rust types -------------------------
//
// parse_manifest is now a thin shell over morloc_manifest::parse_manifest
// (which does all the JSON parsing, version checking, and serde
// validation). The walker functions below convert the Rust-native
// structs into owned C structs, mirroring the v2 schema field-for-field.
/// Copy one Rust-side Constraint into its C-ABI counterpart.
/// The optional JSON value is serialized to an owned C string.
unsafe fn populate_constraint(dst: *mut ManifestConstraint, src: &morloc_manifest::Constraint) {
    (*dst).ctype = c_strdup(&src.ctype);
    (*dst).value_json = match &src.value {
        Some(v) => c_strdup(&v.to_string()),
        None => ptr::null_mut(),
    };
}

/// Convert a slice of constraints into an owned C array.
/// Returns (NULL, 0) for an empty slice.
/// NOTE(review): stripped generic below -- presumably
/// size_of::<ManifestConstraint>().
unsafe fn populate_constraints(
    src: &[morloc_manifest::Constraint],
) -> (*mut ManifestConstraint, usize) {
    if src.is_empty() {
        return (ptr::null_mut(), 0);
    }
    let arr = libc::calloc(src.len(), std::mem::size_of::()) as *mut ManifestConstraint;
    for (i, c) in src.iter().enumerate() {
        populate_constraint(arr.add(i), c);
    }
    (arr, src.len())
}

/// Serialize a Metadata map to an owned C JSON string ("{}" when
/// empty or when serialization fails).
unsafe fn populate_metadata(src: &morloc_manifest::Metadata) -> *mut c_char {
    if src.is_empty() {
        c_strdup("{}")
    } else {
        let s = serde_json::to_string(src).unwrap_or_else(|_| "{}".into());
        c_strdup(&s)
    }
}

/// Convert a Vec to a NULL-terminated array of C strings,
/// and return (pointer, count). Caller owns the allocation.
unsafe fn populate_str_vec(src: &[String]) -> (*mut *mut c_char, usize) {
    let n = src.len();
    let arr = libc::calloc(n + 1, std::mem::size_of::<*mut c_char>()) as *mut *mut c_char;
    for (i, s) in src.iter().enumerate() {
        *arr.add(i) = c_strdup(s);
    }
    *arr.add(n) = ptr::null_mut();
    (arr, n)
}

/// Copy one Rust-side Arg variant into a C ManifestArg. `dst` is
/// assumed zero-initialized (calloc'd), so fields not set by a given
/// variant stay NULL/0. Group entries recurse via populate_arg.
unsafe fn populate_arg(dst: *mut ManifestArg, src: &morloc_manifest::Arg) {
    use morloc_manifest::Arg;
    match src {
        Arg::Positional { schema, type_desc, metavar, quoted, desc, constraints, .. } => {
            (*dst).kind = ManifestArgKind::Pos;
            (*dst).schema = nullable_strdup(schema.as_deref());
            (*dst).type_desc = nullable_strdup(type_desc.as_deref());
            (*dst).metavar = nullable_strdup(metavar.as_deref());
            (*dst).quoted = *quoted;
            let (d, n) = populate_str_vec(desc);
            (*dst).desc = d;
            (*dst).n_desc = n;
            let (cs, nc) = populate_constraints(constraints);
            (*dst).constraints = cs;
            (*dst).n_constraints = nc;
            (*dst).metadata_json = c_strdup("{}");
        }
        Arg::Optional {
            schema, type_desc, metavar, quoted, short_opt, long_opt, default_val, desc, constraints, ..
        } => {
            (*dst).kind = ManifestArgKind::Opt;
            (*dst).schema = nullable_strdup(schema.as_deref());
            (*dst).type_desc = nullable_strdup(type_desc.as_deref());
            (*dst).metavar = nullable_strdup(metavar.as_deref());
            (*dst).quoted = *quoted;
            // Only the first byte of the short-option string is kept
            // (0 when absent).
            (*dst).short_opt = short_opt
                .as_ref()
                .and_then(|s| s.as_bytes().first().copied())
                .map(|b| b as c_char)
                .unwrap_or(0);
            (*dst).long_opt = nullable_strdup(long_opt.as_deref());
            (*dst).default_val = nullable_strdup(default_val.as_deref());
            let (d, n) = populate_str_vec(desc);
            (*dst).desc = d;
            (*dst).n_desc = n;
            let (cs, nc) = populate_constraints(constraints);
            (*dst).constraints = cs;
            (*dst).n_constraints = nc;
            (*dst).metadata_json = c_strdup("{}");
        }
        Arg::Flag { short_opt, long_opt, long_rev, default_val, desc, .. } => {
            (*dst).kind = ManifestArgKind::Flag;
            (*dst).short_opt = short_opt
                .as_ref()
                .and_then(|s| s.as_bytes().first().copied())
                .map(|b| b as c_char)
                .unwrap_or(0);
            (*dst).long_opt = nullable_strdup(long_opt.as_deref());
            (*dst).long_rev = nullable_strdup(long_rev.as_deref());
            (*dst).default_val = nullable_strdup(default_val.as_deref());
            let (d, n) = populate_str_vec(desc);
            (*dst).desc = d;
            (*dst).n_desc = n;
            (*dst).metadata_json = c_strdup("{}");
        }
        Arg::Group {
            schema, type_desc, metavar, desc, group_opt, entries, constraints, ..
        } => {
            (*dst).kind = ManifestArgKind::Grp;
            (*dst).schema = nullable_strdup(schema.as_deref());
            (*dst).type_desc = nullable_strdup(type_desc.as_deref());
            (*dst).metavar = nullable_strdup(metavar.as_deref());
            let (d, n) = populate_str_vec(desc);
            (*dst).desc = d;
            (*dst).n_desc = n;
            if let Some(g) = group_opt {
                (*dst).grp_short = g
                    .short_opt
                    .as_ref()
                    .and_then(|s| s.as_bytes().first().copied())
                    .map(|b| b as c_char)
                    .unwrap_or(0);
                (*dst).grp_long = nullable_strdup(g.long_opt.as_deref());
            }
            if !entries.is_empty() {
                (*dst).n_entries = entries.len();
                // NOTE(review): stripped generic -- presumably
                // size_of::<ManifestGrpEntry>().
                (*dst).entries = libc::calloc(
                    entries.len(),
                    std::mem::size_of::(),
                ) as *mut ManifestGrpEntry;
                for (i, ge) in entries.iter().enumerate() {
                    let ge_dst = &mut *(*dst).entries.add(i);
                    ge_dst.key = c_strdup(&ge.key);
                    // NOTE(review): stripped generic -- presumably
                    // size_of::<ManifestArg>().
                    let sub_arg = libc::calloc(1, std::mem::size_of::()) as *mut ManifestArg;
                    populate_arg(sub_arg, &ge.arg);
                    ge_dst.arg = sub_arg;
                }
            }
            let (cs, nc) = populate_constraints(constraints);
            (*dst).constraints = cs;
            (*dst).n_constraints = nc;
            (*dst).metadata_json = c_strdup("{}");
        }
    }
}

/// Copy the Rust-side Return descriptor into the embedded C sub-struct.
unsafe fn populate_return(dst: *mut ManifestReturn, src: &morloc_manifest::Return) {
    (*dst).schema = c_strdup(&src.schema);
    (*dst).type_desc = c_strdup(&src.type_desc);
    let (d, n) = populate_str_vec(&src.desc);
    (*dst).desc = d;
    (*dst).n_desc = n;
    let (cs, nc) = populate_constraints(&src.constraints);
    (*dst).constraints = cs;
    (*dst).n_constraints = nc;
    (*dst).metadata_json = populate_metadata(&src.metadata);
}

/// Copy one Rust-side Command into a zero-initialized C ManifestCommand.
/// Builds the expression tree only for pure commands; returns Err if
/// expression construction fails.
unsafe fn populate_command(dst: *mut ManifestCommand, src: &morloc_manifest::Command) -> Result<(), MorlocError> {
    (*dst).name = c_strdup(&src.name);
    (*dst).is_pure = src.is_pure();
    (*dst).mid = src.mid;
    (*dst).pool_index = src.pool_index;
    if !src.needed_pools.is_empty() {
        (*dst).n_needed_pools = src.needed_pools.len();
        // NOTE(review): stripped generic -- presumably size_of::<usize>().
        (*dst).needed_pools = libc::calloc(
            src.needed_pools.len(),
            std::mem::size_of::(),
        ) as *mut usize;
        for (i, p) in src.needed_pools.iter().enumerate() {
            *(*dst).needed_pools.add(i) = *p;
        }
    }
    let (d, n) = populate_str_vec(&src.desc);
    (*dst).desc = d;
    (*dst).n_desc = n;
    if !src.args.is_empty() {
        (*dst).n_args = src.args.len();
        // NOTE(review): stripped generic -- presumably size_of::<ManifestArg>().
        (*dst).args = libc::calloc(
            src.args.len(),
            std::mem::size_of::(),
        ) as *mut ManifestArg;
        for (i, a) in src.args.iter().enumerate() {
            populate_arg((*dst).args.add(i), a);
        }
    }
    populate_return(&mut (*dst).ret, &src.ret);
    let (cs, nc) = populate_constraints(&src.constraints);
    (*dst).constraints = cs;
    (*dst).n_constraints = nc;
    (*dst).metadata_json = populate_metadata(&src.metadata);
    if src.is_pure() {
        if let Some(expr_val) = &src.expr {
            match build_expr(expr_val) {
                Ok(e) => (*dst).expr = e,
                Err(e) => return Err(e),
            }
        }
    }
    (*dst).group = match &src.group {
        Some(g) => c_strdup(g),
        None => ptr::null_mut(),
    };
    Ok(())
}

/// Copy one Rust-side Pool (language, exec argv, socket, metadata)
/// into its C counterpart; exec becomes a NULL-terminated argv array.
unsafe fn populate_pool(dst: *mut ManifestPool, src: &morloc_manifest::Pool) {
    (*dst).lang = c_strdup(&src.lang);
    let n = src.exec.len();
    (*dst).exec = libc::calloc(n + 1, std::mem::size_of::<*mut c_char>()) as *mut *mut c_char;
    for (i, e) in src.exec.iter().enumerate() {
        *(*dst).exec.add(i) = c_strdup(e);
    }
    *(*dst).exec.add(n) = ptr::null_mut();
    (*dst).socket = c_strdup(&src.socket);
    (*dst).metadata_json = populate_metadata(&src.metadata);
}

/// Copy one Rust-side CmdGroup into its C counterpart.
unsafe fn populate_cmd_group(dst: *mut ManifestCmdGroup, src: &morloc_manifest::CmdGroup) {
    (*dst).name = c_strdup(&src.name);
    let (d, n) = populate_str_vec(&src.desc);
    (*dst).desc = d;
    (*dst).n_desc = n;
    (*dst).metadata_json = populate_metadata(&src.metadata);
}

/// Copy the optional Rust-side Service block into its C counterpart
/// (missing port maps to 0, missing strings to NULL).
unsafe fn populate_service(dst: *mut ManifestService, src: &morloc_manifest::Service) {
    (*dst).stype = nullable_strdup(src.service_type.as_deref());
    (*dst).host = nullable_strdup(src.host.as_deref());
    (*dst).port = src.port.unwrap_or(0);
    (*dst).socket = nullable_strdup(src.socket.as_deref());
    (*dst).metadata_json = populate_metadata(&src.metadata);
}

// -- parse_manifest -----------------------------------------------------------
//
// Reads a manifest JSON string, parses it via the canonical
// morloc-manifest crate (which performs the
// version staleness check),
// and converts the resulting Rust struct into owned C structs for
// daemon-side consumers. There is no separate JSON walker here -- the
// shape and validation rules live in one place (the morloc-manifest
// crate).

/// C entry point: parse a manifest JSON string into an owned C
/// Manifest. On failure, writes a message into `errmsg` and returns
/// NULL. The result must be released with free_manifest.
///
/// NOTE(review): when populate_command fails mid-loop, the
/// partially-built Manifest `m` is NOT freed before returning NULL --
/// looks like a leak; consider calling free_manifest(m). TODO confirm.
/// Stripped generics below -- presumably size_of::<Manifest>(),
/// size_of::<ManifestPool>(), etc.
#[no_mangle]
pub unsafe extern "C" fn parse_manifest(
    text: *const c_char,
    errmsg: *mut *mut c_char,
) -> *mut Manifest {
    clear_errmsg(errmsg);
    let s = CStr::from_ptr(text).to_string_lossy();
    let parsed = match morloc_manifest::parse_manifest(&s) {
        Ok(p) => p,
        Err(e) => {
            set_errmsg(errmsg, &MorlocError::Other(e));
            return ptr::null_mut();
        }
    };
    let m = libc::calloc(1, std::mem::size_of::()) as *mut Manifest;
    (*m).name = c_strdup(&parsed.name);
    // build sub-object
    (*m).build.path = c_strdup(&parsed.build.path);
    (*m).build.time = parsed.build.time;
    (*m).build.morloc_version = c_strdup(&parsed.build.morloc_version);
    // pools
    if !parsed.pools.is_empty() {
        (*m).n_pools = parsed.pools.len();
        (*m).pools = libc::calloc(
            parsed.pools.len(),
            std::mem::size_of::(),
        ) as *mut ManifestPool;
        for (i, p) in parsed.pools.iter().enumerate() {
            populate_pool((*m).pools.add(i), p);
        }
    }
    // commands
    if !parsed.commands.is_empty() {
        (*m).n_commands = parsed.commands.len();
        (*m).commands = libc::calloc(
            parsed.commands.len(),
            std::mem::size_of::(),
        ) as *mut ManifestCommand;
        for (i, c) in parsed.commands.iter().enumerate() {
            if let Err(e) = populate_command((*m).commands.add(i), c) {
                set_errmsg(errmsg, &e);
                return ptr::null_mut();
            }
        }
    }
    // groups
    if !parsed.groups.is_empty() {
        (*m).n_groups = parsed.groups.len();
        (*m).groups = libc::calloc(
            parsed.groups.len(),
            std::mem::size_of::(),
        ) as *mut ManifestCmdGroup;
        for (i, g) in parsed.groups.iter().enumerate() {
            populate_cmd_group((*m).groups.add(i), g);
        }
    }
    // service
    if let Some(svc) = parsed.service {
        (*m).service = libc::calloc(1, std::mem::size_of::()) as *mut ManifestService;
        populate_service((*m).service, &svc);
    }
    (*m).metadata_json = populate_metadata(&parsed.metadata);
    m
}

// -- read_manifest ------------------------------------------------------------

/// C entry point: read a manifest file from `path` and delegate to
/// parse_manifest. I/O errors are reported through `errmsg`.
#[no_mangle]
pub unsafe extern "C" fn read_manifest(
    path: *const c_char,
    errmsg: *mut *mut c_char,
) -> *mut Manifest {
    clear_errmsg(errmsg);
    let path_str = CStr::from_ptr(path).to_string_lossy();
    match std::fs::read_to_string(path_str.as_ref()) {
        Ok(text) => {
            let c_text = CString::new(text).unwrap_or_default();
            parse_manifest(c_text.as_ptr(), errmsg)
        }
        Err(e) => {
            set_errmsg(errmsg, &MorlocError::Io(e));
            ptr::null_mut()
        }
    }
}

// -- free_manifest ------------------------------------------------------------
//
// Walks the v2 C structs and releases every owned C string + sub-allocation.
// Helper functions mirror the populate_* helpers above for symmetry.

/// Free a NULL-terminated array of owned C strings (and the array itself).
/// NULL input is a no-op.
unsafe fn free_str_array(arr: *mut *mut c_char) {
    if arr.is_null() {
        return;
    }
    let mut j = 0;
    while !(*arr.add(j)).is_null() {
        libc::free(*arr.add(j) as *mut c_void);
        j += 1;
    }
    libc::free(arr as *mut c_void);
}

/// Free an array of `n` constraints, including each element's owned
/// strings. NULL input is a no-op.
unsafe fn free_constraints(ptr: *mut ManifestConstraint, n: usize) {
    if ptr.is_null() {
        return;
    }
    for i in 0..n {
        let c = &*ptr.add(i);
        if !c.ctype.is_null() {
            libc::free(c.ctype as *mut c_void);
        }
        if !c.value_json.is_null() {
            libc::free(c.value_json as *mut c_void);
        }
    }
    libc::free(ptr as *mut c_void);
}

/// Free the owned contents of one ManifestArg (recursing into group
/// entries). Does NOT free `arg` itself -- the containing array owner
/// does that.
unsafe fn free_arg(arg: &ManifestArg) {
    if !arg.schema.is_null() { libc::free(arg.schema as *mut c_void); }
    if !arg.type_desc.is_null() { libc::free(arg.type_desc as *mut c_void); }
    if !arg.metavar.is_null() { libc::free(arg.metavar as *mut c_void); }
    if !arg.long_opt.is_null() { libc::free(arg.long_opt as *mut c_void); }
    if !arg.long_rev.is_null() { libc::free(arg.long_rev as *mut c_void); }
    if !arg.default_val.is_null() { libc::free(arg.default_val as *mut c_void); }
    free_str_array(arg.desc);
    free_constraints(arg.constraints, arg.n_constraints);
    if !arg.grp_long.is_null() { libc::free(arg.grp_long as *mut c_void); }
    if !arg.entries.is_null() {
        for i in 0..arg.n_entries {
            let ge = &*arg.entries.add(i);
            if !ge.key.is_null() {
                libc::free(ge.key as *mut c_void);
            }
            if !ge.arg.is_null() {
                // Sub-args are individually heap-allocated (see
                // populate_arg), so free contents then the node.
                free_arg(&*ge.arg);
                libc::free(ge.arg as *mut c_void);
            }
        }
        libc::free(arg.entries as *mut c_void);
    }
    if !arg.metadata_json.is_null() { libc::free(arg.metadata_json as *mut c_void); }
}

/// Free the owned contents of an embedded ManifestReturn sub-struct.
unsafe fn free_return(ret: &ManifestReturn) {
    if !ret.schema.is_null() { libc::free(ret.schema as *mut c_void); }
    if !ret.type_desc.is_null() { libc::free(ret.type_desc as *mut c_void); }
    free_str_array(ret.desc);
    free_constraints(ret.constraints, ret.n_constraints);
    if !ret.metadata_json.is_null() { libc::free(ret.metadata_json as *mut c_void); }
}

/// C entry point: release an entire Manifest produced by
/// parse_manifest/read_manifest. NULL input is a no-op.
#[no_mangle]
pub unsafe extern "C" fn free_manifest(manifest: *mut Manifest) {
    if manifest.is_null() {
        return;
    }
    let m = &*manifest;
    if !m.name.is_null() { libc::free(m.name as *mut c_void); }
    // build sub-object
    if !m.build.path.is_null() { libc::free(m.build.path as *mut c_void); }
    if !m.build.morloc_version.is_null() { libc::free(m.build.morloc_version as *mut c_void); }
    // pools
    for i in 0..m.n_pools {
        let pool = &*m.pools.add(i);
        if !pool.lang.is_null() { libc::free(pool.lang as *mut c_void); }
        free_str_array(pool.exec);
        if !pool.socket.is_null() { libc::free(pool.socket as *mut c_void); }
        if !pool.metadata_json.is_null() { libc::free(pool.metadata_json as *mut c_void); }
    }
    if !m.pools.is_null() { libc::free(m.pools as *mut c_void); }
    // commands
    for i in 0..m.n_commands {
        let cmd = &*m.commands.add(i);
        if !cmd.name.is_null() { libc::free(cmd.name as *mut c_void); }
        if !cmd.needed_pools.is_null() { libc::free(cmd.needed_pools as *mut c_void); }
        free_str_array(cmd.desc);
        for j in 0..cmd.n_args {
            free_arg(&*cmd.args.add(j));
        }
        if !cmd.args.is_null() { libc::free(cmd.args as *mut c_void); }
        free_return(&cmd.ret);
        free_constraints(cmd.constraints, cmd.n_constraints);
        if !cmd.group.is_null() { libc::free(cmd.group as *mut c_void); }
        if !cmd.metadata_json.is_null() { libc::free(cmd.metadata_json as *mut c_void); }
        // Note: cmd.expr is owned by the C side and freed by its own
        // free function in eval_ffi.rs (not in scope here).
    }
    if !m.commands.is_null() { libc::free(m.commands as *mut c_void); }
    // groups
    for i in 0..m.n_groups {
        let g = &*m.groups.add(i);
        if !g.name.is_null() { libc::free(g.name as *mut c_void); }
        free_str_array(g.desc);
        if !g.metadata_json.is_null() { libc::free(g.metadata_json as *mut c_void); }
    }
    if !m.groups.is_null() { libc::free(m.groups as *mut c_void); }
    // service
    if !m.service.is_null() {
        let svc = &*m.service;
        if !svc.stype.is_null() { libc::free(svc.stype as *mut c_void); }
        if !svc.host.is_null() { libc::free(svc.host as *mut c_void); }
        if !svc.socket.is_null() { libc::free(svc.socket as *mut c_void); }
        if !svc.metadata_json.is_null() { libc::free(svc.metadata_json as *mut c_void); }
        libc::free(m.service as *mut c_void);
    }
    if !m.metadata_json.is_null() { libc::free(m.metadata_json as *mut c_void); }
    libc::free(manifest as *mut c_void);
}

// -- manifest_to_discovery_json -----------------------------------------------
//
// Emits a v2-shape JSON describing the manifest's commands. Used by the
// daemon/router code for discovery RPC. The output mirrors the morloc
// compiler's manifest format closely (no v1 legacy field names).
/// C entry point: serialize a Manifest into a discovery JSON string
/// using the C-side json_buf writer. Returns NULL only for a NULL
/// manifest; the returned string is allocated by json_buf_finish.
#[no_mangle]
pub unsafe extern "C" fn manifest_to_discovery_json(manifest: *const Manifest) -> *mut c_char {
    if manifest.is_null() {
        return ptr::null_mut();
    }
    let m = &*manifest;
    extern "C" {
        fn json_buf_new() -> *mut c_void;
        fn json_buf_finish(jb: *mut c_void) -> *mut c_char;
        fn json_write_obj_start(jb: *mut c_void);
        fn json_write_obj_end(jb: *mut c_void);
        fn json_write_arr_start(jb: *mut c_void);
        fn json_write_arr_end(jb: *mut c_void);
        fn json_write_key(jb: *mut c_void, key: *const c_char);
        fn json_write_string(jb: *mut c_void, val: *const c_char);
    }
    let jb = json_buf_new();
    json_write_obj_start(jb);
    // Shared key literals (NUL-terminated byte strings).
    let name_key = b"name\0".as_ptr() as *const c_char;
    let type_key = b"type\0".as_ptr() as *const c_char;
    let kind_key = b"kind\0".as_ptr() as *const c_char;
    let schema_key = b"schema\0".as_ptr() as *const c_char;
    json_write_key(jb, name_key);
    json_write_string(
        jb,
        if m.name.is_null() { b"unknown\0".as_ptr() as *const c_char } else { m.name },
    );
    // Surface the morloc compiler version that built this manifest.
    if !m.build.morloc_version.is_null() {
        let mv_key = b"morloc_version\0".as_ptr() as *const c_char;
        json_write_key(jb, mv_key);
        json_write_string(jb, m.build.morloc_version);
    }
    let commands_key = b"commands\0".as_ptr() as *const c_char;
    json_write_key(jb, commands_key);
    json_write_arr_start(jb);
    for i in 0..m.n_commands {
        let cmd = &*m.commands.add(i);
        json_write_obj_start(jb);
        json_write_key(jb, name_key);
        json_write_string(jb, cmd.name);
        json_write_key(jb, type_key);
        json_write_string(
            jb,
            if cmd.is_pure { b"pure\0".as_ptr() as *const c_char } else { b"remote\0".as_ptr() as *const c_char },
        );
        // Return descriptor (nested return object).
        if !cmd.ret.type_desc.is_null() || !cmd.ret.schema.is_null() {
            let ret_key = b"return\0".as_ptr() as *const c_char;
            json_write_key(jb, ret_key);
            json_write_obj_start(jb);
            if !cmd.ret.type_desc.is_null() {
                json_write_key(jb, type_key);
                json_write_string(jb, cmd.ret.type_desc);
            }
            if !cmd.ret.schema.is_null() {
                json_write_key(jb, schema_key);
                json_write_string(jb, cmd.ret.schema);
            }
            json_write_obj_end(jb);
        }
        // Args. Each arg's schema (if any) is on the arg itself; no
        // parallel array, no flag-skipping bug.
        let args_key = b"args\0".as_ptr() as *const c_char;
        json_write_key(jb, args_key);
        json_write_arr_start(jb);
        for a in 0..cmd.n_args {
            let arg = &*cmd.args.add(a);
            json_write_obj_start(jb);
            json_write_key(jb, kind_key);
            match arg.kind {
                ManifestArgKind::Pos => json_write_string(jb, b"pos\0".as_ptr() as *const c_char),
                ManifestArgKind::Opt => json_write_string(jb, b"opt\0".as_ptr() as *const c_char),
                ManifestArgKind::Flag => json_write_string(jb, b"flag\0".as_ptr() as *const c_char),
                ManifestArgKind::Grp => json_write_string(jb, b"grp\0".as_ptr() as *const c_char),
            }
            if !arg.metavar.is_null() {
                json_write_key(jb, b"metavar\0".as_ptr() as *const c_char);
                json_write_string(jb, arg.metavar);
            }
            if !arg.type_desc.is_null() {
                json_write_key(jb, type_key);
                json_write_string(jb, arg.type_desc);
            }
            if !arg.schema.is_null() {
                json_write_key(jb, schema_key);
                json_write_string(jb, arg.schema);
            }
            if !arg.default_val.is_null() {
                json_write_key(jb, b"default\0".as_ptr() as *const c_char);
                json_write_string(jb, arg.default_val);
            }
            if !arg.long_opt.is_null() {
                json_write_key(jb, b"long\0".as_ptr() as *const c_char);
                json_write_string(jb, arg.long_opt);
            }
            if arg.short_opt != 0 {
                // Build a 2-byte NUL-terminated C string on the stack.
                let short_str = [arg.short_opt as u8, 0];
                json_write_key(jb, b"short\0".as_ptr() as *const c_char);
                json_write_string(jb, short_str.as_ptr() as *const c_char);
            }
            // Only the first (non-empty) description line is surfaced.
            if arg.n_desc > 0 && !arg.desc.is_null() && !(*arg.desc).is_null() {
                let first = *arg.desc;
                if *first != 0 {
                    let desc_key = b"desc\0".as_ptr() as *const c_char;
                    json_write_key(jb, desc_key);
                    json_write_string(jb, first);
                }
            }
            json_write_obj_end(jb);
        }
        json_write_arr_end(jb);
        if cmd.n_desc > 0 && !cmd.desc.is_null() && !(*cmd.desc).is_null() {
            let first = *cmd.desc;
            if *first != 0 {
                json_write_key(jb, b"desc\0".as_ptr() as *const c_char);
                json_write_string(jb, first);
            }
        }
        if !cmd.group.is_null() {
            json_write_key(jb, b"group\0".as_ptr() as *const c_char);
            json_write_string(jb, cmd.group);
        }
        json_write_obj_end(jb);
    }
    json_write_arr_end(jb);
    if m.n_groups > 0 {
        let groups_key = b"groups\0".as_ptr() as *const c_char;
        json_write_key(jb, groups_key);
        json_write_arr_start(jb);
        for i in 0..m.n_groups {
            let g = &*m.groups.add(i);
            json_write_obj_start(jb);
            json_write_key(jb, name_key);
            json_write_string(jb, g.name);
            if g.n_desc > 0 && !g.desc.is_null() && !(*g.desc).is_null() {
                json_write_key(jb, b"desc\0".as_ptr() as *const c_char);
                json_write_string(jb, *g.desc);
            }
            json_write_obj_end(jb);
        }
        json_write_arr_end(jb);
    }
    json_write_obj_end(jb);
    json_buf_finish(jb)
}



================================================
FILE: data/rust/morloc-runtime/src/mpack.rs
================================================
//! MessagePack <-> Voidstar conversion.
//!
//! Replaces serialize.c + mpack.c. Uses the `rmp` crate for MessagePack I/O.
//! The voidstar binary format is morloc-specific (Array/Tensor structs with relptrs).

use crate::error::MorlocError;
use crate::schema::{Schema, SerialType};
use crate::shm::{self, AbsPtr, Array, RELNULL};

// ── Voidstar -> MessagePack ────────────────────────────────────────────────

/// Serialize voidstar data to MessagePack bytes.
/// NOTE(review): return type has a stripped generic -- presumably
/// Result<Vec<u8>, MorlocError>.
pub fn pack_with_schema(ptr: AbsPtr, schema: &Schema) -> Result, MorlocError> {
    let mut buf = Vec::with_capacity(256);
    pack_data(ptr, schema, &mut buf)?;
    Ok(buf)
}

/// Recursively encode one voidstar value (at `ptr`, described by
/// `schema`) into `buf` as MessagePack.
/// NOTE(review): `&mut Vec` has a stripped generic -- presumably
/// &mut Vec<u8>.
fn pack_data(ptr: AbsPtr, schema: &Schema, buf: &mut Vec) -> Result<(), MorlocError> {
    // SAFETY: ptr points to voidstar data in SHM with layout described by schema.
    // All reads are within bounds defined by schema.width, Array headers, etc.
    unsafe {
        match schema.serial_type {
            SerialType::Nil => {
                rmp::encode::write_nil(buf)
                    .map_err(|e| MorlocError::Serialization(format!("msgpack nil: {}", e)))?;
            }
            SerialType::Bool => {
                let v = *ptr != 0;
                rmp::encode::write_bool(buf, v)
                    .map_err(|e| MorlocError::Serialization(format!("msgpack bool: {}", e)))?;
            }
            SerialType::Uint8 => {
                rmp::encode::write_uint(buf, *ptr as u64)
                    .map_err(|e| MorlocError::Serialization(format!("msgpack uint: {}", e)))?;
            }
            SerialType::Uint16 => {
                rmp::encode::write_uint(buf, *(ptr as *const u16) as u64)
                    .map_err(|e| MorlocError::Serialization(format!("msgpack uint: {}", e)))?;
            }
            SerialType::Uint32 => {
                rmp::encode::write_uint(buf, *(ptr as *const u32) as u64)
                    .map_err(|e| MorlocError::Serialization(format!("msgpack uint: {}", e)))?;
            }
            SerialType::Uint64 => {
                rmp::encode::write_uint(buf, *(ptr as *const u64))
                    .map_err(|e| MorlocError::Serialization(format!("msgpack uint: {}", e)))?;
            }
            SerialType::Sint8 => {
                rmp::encode::write_sint(buf, *(ptr as *const i8) as i64)
                    .map_err(|e| MorlocError::Serialization(format!("msgpack sint: {}", e)))?;
            }
            SerialType::Sint16 => {
                rmp::encode::write_sint(buf, *(ptr as *const i16) as i64)
                    .map_err(|e| MorlocError::Serialization(format!("msgpack sint: {}", e)))?;
            }
            SerialType::Sint32 => {
                rmp::encode::write_sint(buf, *(ptr as *const i32) as i64)
                    .map_err(|e| MorlocError::Serialization(format!("msgpack sint: {}", e)))?;
            }
            SerialType::Sint64 => {
                rmp::encode::write_sint(buf, *(ptr as *const i64))
                    .map_err(|e| MorlocError::Serialization(format!("msgpack sint: {}", e)))?;
            }
            SerialType::Float32 => {
                // f32 values are widened to f64 on the wire.
                let f = *(ptr as *const f32) as f64;
                rmp::encode::write_f64(buf, f)
                    .map_err(|e| MorlocError::Serialization(format!("msgpack float: {}", e)))?;
            }
            SerialType::Float64 => {
                let f = *(ptr as *const f64);
                rmp::encode::write_f64(buf, f)
                    .map_err(|e| MorlocError::Serialization(format!("msgpack float: {}", e)))?;
            }
            SerialType::String => {
                // Strings are Array headers whose data is raw bytes in SHM.
                let arr = &*(ptr as *const Array);
                let data = shm::rel2abs(arr.data)?;
                let bytes = std::slice::from_raw_parts(data, arr.size);
                rmp::encode::write_str_len(buf, arr.size as u32)
                    .map_err(|e| MorlocError::Serialization(format!("msgpack str: {}", e)))?;
                buf.extend_from_slice(bytes);
            }
            SerialType::Array => {
                let arr = &*(ptr as *const Array);
                let elem_schema = &schema.parameters[0];
                let elem_width = elem_schema.width;
                rmp::encode::write_array_len(buf, arr.size as u32)
                    .map_err(|e| MorlocError::Serialization(format!("msgpack array: {}", e)))?;
                // RELNULL data with size 0 means an empty array; skip reads.
                if arr.size > 0 && arr.data != RELNULL {
                    let data = shm::rel2abs(arr.data)?;
                    for i in 0..arr.size {
                        let elem_ptr = data.add(i * elem_width);
                        pack_data(elem_ptr, elem_schema, buf)?;
                    }
                }
            }
            SerialType::Tuple | SerialType::Map => {
                // Tuples and maps are encoded positionally as msgpack arrays;
                // field offsets come from the schema.
                rmp::encode::write_array_len(buf, schema.parameters.len() as u32)
                    .map_err(|e| MorlocError::Serialization(format!("msgpack tuple: {}", e)))?;
                for (i, field_schema) in schema.parameters.iter().enumerate() {
                    let field_ptr = ptr.add(schema.offsets[i]);
                    pack_data(field_ptr, field_schema, buf)?;
                }
            }
            SerialType::Optional => {
                // Leading tag byte: 0 => None (nil), nonzero => Some(payload).
                let tag = *ptr;
                if tag == 0 {
                    rmp::encode::write_nil(buf)
                        .map_err(|e| MorlocError::Serialization(format!("msgpack nil: {}", e)))?;
                } else {
                    let inner_schema = &schema.parameters[0];
                    // Payload offset: prefer the schema's recorded offset,
                    // otherwise align past the 1-byte tag.
                    let inner_offset = schema.offsets.first().copied()
                        .unwrap_or_else(|| shm::align_up(1, inner_schema.alignment().max(1)));
                    let inner_ptr = ptr.add(inner_offset);
                    pack_data(inner_ptr, inner_schema, buf)?;
                }
            }
            SerialType::Tensor => {
                return Err(MorlocError::Serialization(
                    "MessagePack serialization of tensors not yet supported".into(),
                ));
            }
        }
    }
    Ok(())
}

// ── MessagePack -> Voidstar ────────────────────────────────────────────────

/// Deserialize MessagePack bytes into voidstar format in SHM.
pub fn unpack_with_schema(
    data: &[u8],
    schema: &Schema,
) -> Result<AbsPtr, MorlocError> {
    // Two-pass: first calculate size, then deserialize
    let size = calc_unpack_size(data, schema)?;
    let base = shm::shmalloc(size)?;
    // SAFETY: base is freshly allocated with `size` bytes.
    unsafe { std::ptr::write_bytes(base, 0, size) };
    // SAFETY: cursor starts at base + schema.width, within the allocated region.
    // The fixed-width root value lives at `base`; all variable-length payloads
    // (string bytes, array element storage) are appended at `cursor`.
    let mut cursor = unsafe { base.add(schema.width) };
    let mut reader = &data[..];
    unpack_obj(base, schema, &mut cursor, &mut reader)?;
    Ok(base)
}

// Decode one value at `ptr` according to `schema`. `cursor` is the bump
// allocator for variable-length payloads and advances as data is written;
// `reader` is the remaining MessagePack input and is consumed in step.
fn unpack_obj(
    ptr: AbsPtr,
    schema: &Schema,
    cursor: &mut AbsPtr,
    reader: &mut &[u8],
) -> Result<(), MorlocError> {
    use rmp::decode;
    // SAFETY: ptr and cursor point into a single contiguous SHM allocation
    // sized by calc_unpack_size. Each write respects schema.width bounds.
    unsafe {
        match schema.serial_type {
            SerialType::Nil => {
                decode::read_nil(reader)
                    .map_err(|e| MorlocError::Serialization(format!("msgpack nil: {}", e)))?;
                *ptr = 0;
            }
            SerialType::Bool => {
                let v = decode::read_bool(reader)
                    .map_err(|e| MorlocError::Serialization(format!("msgpack bool: {}", e)))?;
                *ptr = v as u8;
            }
            // All integer widths share one decoder that writes exactly the
            // width implied by the schema's serial type.
            SerialType::Uint8
            | SerialType::Uint16
            | SerialType::Uint32
            | SerialType::Uint64
            | SerialType::Sint8
            | SerialType::Sint16
            | SerialType::Sint32
            | SerialType::Sint64 => {
                unpack_int(ptr, schema.serial_type, reader)?;
            }
            SerialType::Float32 => {
                // read_float also accepts integer markers for integer-valued floats.
                let f = read_float(reader)?;
                *(ptr as *mut f32) = f as f32;
            }
            SerialType::Float64 => {
                let f = read_float(reader)?;
                *(ptr as *mut f64) = f;
            }
            SerialType::String => {
                let len = decode::read_str_len(reader)
                    .map_err(|e| MorlocError::Serialization(format!("msgpack str len: {}", e)))?
as usize; let arr = &mut *(ptr as *mut Array); arr.size = len; arr.data = shm::abs2rel(*cursor)?; // Read string bytes directly if len > 0 { if reader.len() < len { return Err(MorlocError::Serialization("msgpack str truncated".into())); } std::ptr::copy_nonoverlapping(reader.as_ptr(), *cursor, len); *reader = &reader[len..]; } *cursor = cursor.add(len); } SerialType::Array => { let n = decode::read_array_len(reader) .map_err(|e| MorlocError::Serialization(format!("msgpack array len: {}", e)))? as usize; let elem_schema = &schema.parameters[0]; let elem_width = elem_schema.width; let arr = &mut *(ptr as *mut Array); arr.size = n; // Align cursor for element data let align = elem_schema.alignment(); let aligned = shm::align_up(*cursor as usize, align); *cursor = aligned as AbsPtr; arr.data = shm::abs2rel(*cursor)?; let data_start = *cursor; *cursor = cursor.add(n * elem_width); for i in 0..n { let elem_ptr = data_start.add(i * elem_width); unpack_obj(elem_ptr, elem_schema, cursor, reader)?; } } SerialType::Tuple | SerialType::Map => { let _n = decode::read_array_len(reader) .map_err(|e| MorlocError::Serialization(format!("msgpack tuple len: {}", e)))?; for (i, field_schema) in schema.parameters.iter().enumerate() { let field_ptr = ptr.add(schema.offsets[i]); unpack_obj(field_ptr, field_schema, cursor, reader)?; } } SerialType::Optional => { let inner_schema = &schema.parameters[0]; let inner_offset = schema.offsets.first().copied() .unwrap_or_else(|| shm::align_up(1, inner_schema.alignment().max(1))); // Peek at the next byte to detect nil if !reader.is_empty() && reader[0] == 0xc0 { // Null: consume nil byte, set tag = 0 decode::read_nil(reader) .map_err(|e| MorlocError::Serialization(format!("msgpack nil: {}", e)))?; *ptr = 0; } else { // Present: set tag = 1, parse inner *ptr = 1; let inner_ptr = ptr.add(inner_offset); unpack_obj(inner_ptr, inner_schema, cursor, reader)?; } } SerialType::Tensor => { return Err(MorlocError::Serialization( "MessagePack tensor 
deserialization not yet supported".into(), )); } } } Ok(()) } fn unpack_int(ptr: AbsPtr, st: SerialType, reader: &mut &[u8]) -> Result<(), MorlocError> { // Use rmp's generic read_int which handles all integer markers let val: i64 = rmp::decode::read_int(reader) .map_err(|e| MorlocError::Serialization(format!("msgpack int: {}", e)))?; // SAFETY: ptr points to schema.width bytes in SHM; each cast writes exactly that width. unsafe { match st { SerialType::Sint8 => *(ptr as *mut i8) = val as i8, SerialType::Sint16 => *(ptr as *mut i16) = val as i16, SerialType::Sint32 => *(ptr as *mut i32) = val as i32, SerialType::Sint64 => *(ptr as *mut i64) = val, SerialType::Uint8 => *ptr = val as u8, SerialType::Uint16 => *(ptr as *mut u16) = val as u16, SerialType::Uint32 => *(ptr as *mut u32) = val as u32, SerialType::Uint64 => *(ptr as *mut u64) = val as u64, _ => {} } } Ok(()) } fn read_float(reader: &mut &[u8]) -> Result { let marker = rmp::decode::read_marker(reader) .map_err(|_| MorlocError::Serialization("msgpack float: unexpected EOF".into()))?; match marker { rmp::Marker::F32 => { let bits = read_be_u32(reader)?; Ok(f32::from_bits(bits) as f64) } rmp::Marker::F64 => { let bits = read_be_u64(reader)?; Ok(f64::from_bits(bits)) } // Integer markers can appear for integer-valued floats - read the data manually rmp::Marker::FixPos(v) => Ok(v as f64), rmp::Marker::FixNeg(v) => Ok(v as f64), _ => { // For other integer encodings, read bytes manually let n = match marker { rmp::Marker::U8 => { read_byte(reader)? as f64 } rmp::Marker::U16 => { read_be_u16(reader)? as f64 } rmp::Marker::U32 => { read_be_u32(reader)? as f64 } rmp::Marker::U64 => { read_be_u64(reader)? as f64 } rmp::Marker::I8 => { read_byte(reader)? as i8 as f64 } rmp::Marker::I16 => { read_be_u16(reader)? as i16 as f64 } rmp::Marker::I32 => { read_be_u32(reader)? as i32 as f64 } rmp::Marker::I64 => { read_be_u64(reader)? 
as i64 as f64 } _ => { return Err(MorlocError::Serialization(format!( "unexpected msgpack marker {:?} for float", marker ))); } }; Ok(n) } } } // Also fix read_f32/read_f64 - rmp's functions include the marker, but we already consumed it // So we need to read the raw data bytes directly. fn read_byte(reader: &mut &[u8]) -> Result { if reader.is_empty() { return Err(MorlocError::Serialization("unexpected EOF".into())); } let v = reader[0]; *reader = &reader[1..]; Ok(v) } fn read_be_u16(reader: &mut &[u8]) -> Result { if reader.len() < 2 { return Err(MorlocError::Serialization("unexpected EOF".into())); } let v = u16::from_be_bytes([reader[0], reader[1]]); *reader = &reader[2..]; Ok(v) } fn read_be_u32(reader: &mut &[u8]) -> Result { if reader.len() < 4 { return Err(MorlocError::Serialization("unexpected EOF".into())); } let v = u32::from_be_bytes([reader[0], reader[1], reader[2], reader[3]]); *reader = &reader[4..]; Ok(v) } fn read_be_u64(reader: &mut &[u8]) -> Result { if reader.len() < 8 { return Err(MorlocError::Serialization("unexpected EOF".into())); } let v = u64::from_be_bytes([reader[0], reader[1], reader[2], reader[3], reader[4], reader[5], reader[6], reader[7]]); *reader = &reader[8..]; Ok(v) } // ── Size calculation for unpack ──────────────────────────────────────────── fn calc_unpack_size(data: &[u8], schema: &Schema) -> Result { let mut reader = data; calc_size_r(schema, &mut reader) } fn calc_size_r(schema: &Schema, reader: &mut &[u8]) -> Result { match schema.serial_type { SerialType::Nil => { rmp::decode::read_nil(reader).ok(); Ok(1) } SerialType::Bool => { rmp::decode::read_bool(reader).ok(); Ok(1) } SerialType::Sint8 | SerialType::Uint8 => { skip_int(reader)?; Ok(1) } SerialType::Sint16 | SerialType::Uint16 => { skip_int(reader)?; Ok(2) } SerialType::Sint32 | SerialType::Uint32 | SerialType::Float32 => { skip_int(reader)?; Ok(4) } SerialType::Sint64 | SerialType::Uint64 | SerialType::Float64 => { skip_int(reader)?; Ok(8) } SerialType::String => { 
let len = rmp::decode::read_str_len(reader) .map_err(|e| MorlocError::Serialization(format!("size calc str: {}", e)))? as usize; if reader.len() >= len { *reader = &reader[len..]; } Ok(std::mem::size_of::() + len) } SerialType::Array => { let n = rmp::decode::read_array_len(reader) .map_err(|e| MorlocError::Serialization(format!("size calc array: {}", e)))? as usize; let elem_schema = &schema.parameters[0]; let mut total = std::mem::size_of::(); // Alignment padding total = shm::align_up(total, elem_schema.alignment()); for _ in 0..n { total += calc_size_r(elem_schema, reader)?; } Ok(total) } SerialType::Tuple | SerialType::Map => { let _n = rmp::decode::read_array_len(reader).ok(); let mut total = schema.width; for field_schema in &schema.parameters { if !field_schema.is_fixed_width() { total += calc_size_r(field_schema, reader)?; } else { calc_size_r(field_schema, reader)?; } } Ok(total) } SerialType::Optional => { let inner_schema = &schema.parameters[0]; if !reader.is_empty() && reader[0] == 0xc0 { rmp::decode::read_nil(reader).ok(); Ok(schema.width.max(1 + inner_schema.width)) } else { let inner_size = calc_size_r(inner_schema, reader)?; let align = inner_schema.alignment().max(1); let offset = shm::align_up(1, align); Ok(offset + inner_size) } } SerialType::Tensor => Ok(0), } } fn skip_int(reader: &mut &[u8]) -> Result<(), MorlocError> { let marker = rmp::decode::read_marker(reader) .map_err(|_| MorlocError::Serialization("skip int: unexpected EOF".into()))?; let skip = match marker { rmp::Marker::FixPos(_) | rmp::Marker::FixNeg(_) => 0, rmp::Marker::U8 | rmp::Marker::I8 => 1, rmp::Marker::U16 | rmp::Marker::I16 => 2, rmp::Marker::U32 | rmp::Marker::I32 | rmp::Marker::F32 => 4, rmp::Marker::U64 | rmp::Marker::I64 | rmp::Marker::F64 => 8, _ => 0, }; if reader.len() >= skip { *reader = &reader[skip..]; } Ok(()) } #[cfg(test)] mod tests { use super::*; use crate::schema::parse_schema; use crate::json; fn setup_shm() { crate::init_test_shm(); } #[test] fn 
test_roundtrip_int_via_msgpack() { setup_shm(); let schema = parse_schema("i4").unwrap(); // JSON -> voidstar -> msgpack -> voidstar -> JSON let ptr1 = json::read_json_with_schema("42", &schema).unwrap(); let mpk = pack_with_schema(ptr1, &schema).unwrap(); let ptr2 = unpack_with_schema(&mpk, &schema).unwrap(); let json_out = json::voidstar_to_json_string(ptr2, &schema).unwrap(); assert_eq!(json_out, "42"); } #[test] fn test_roundtrip_string_via_msgpack() { setup_shm(); let schema = parse_schema("s").unwrap(); let ptr1 = json::read_json_with_schema("\"hello world\"", &schema).unwrap(); let mpk = pack_with_schema(ptr1, &schema).unwrap(); let ptr2 = unpack_with_schema(&mpk, &schema).unwrap(); let json_out = json::voidstar_to_json_string(ptr2, &schema).unwrap(); assert_eq!(json_out, "\"hello world\""); } #[test] fn test_roundtrip_array_via_msgpack() { setup_shm(); let schema = parse_schema("ai4").unwrap(); let ptr1 = json::read_json_with_schema("[10,20,30]", &schema).unwrap(); let mpk = pack_with_schema(ptr1, &schema).unwrap(); let ptr2 = unpack_with_schema(&mpk, &schema).unwrap(); let json_out = json::voidstar_to_json_string(ptr2, &schema).unwrap(); assert_eq!(json_out, "[10,20,30]"); } #[test] fn test_roundtrip_bool_via_msgpack() { setup_shm(); let schema = parse_schema("b").unwrap(); let ptr1 = json::read_json_with_schema("true", &schema).unwrap(); let mpk = pack_with_schema(ptr1, &schema).unwrap(); let ptr2 = unpack_with_schema(&mpk, &schema).unwrap(); let json_out = json::voidstar_to_json_string(ptr2, &schema).unwrap(); assert_eq!(json_out, "true"); } #[test] fn test_roundtrip_optional_null_via_msgpack() { setup_shm(); let schema = parse_schema("?i4").unwrap(); let ptr1 = json::read_json_with_schema("null", &schema).unwrap(); let mpk = pack_with_schema(ptr1, &schema).unwrap(); let ptr2 = unpack_with_schema(&mpk, &schema).unwrap(); let json_out = json::voidstar_to_json_string(ptr2, &schema).unwrap(); assert_eq!(json_out, "null"); } #[test] fn 
test_pack_only_string() { setup_shm(); let schema = parse_schema("s").unwrap(); let ptr1 = json::read_json_with_schema("\"hi\"", &schema).unwrap(); let mpk = pack_with_schema(ptr1, &schema).unwrap(); assert!(!mpk.is_empty()); assert_eq!(mpk.len(), 3); } #[test] fn test_unpack_only_int() { setup_shm(); let schema = parse_schema("i4").unwrap(); // msgpack for 42 = [42] (fixint) let mpk = vec![42u8]; let ptr = unpack_with_schema(&mpk, &schema).unwrap(); let json_out = json::voidstar_to_json_string(ptr, &schema).unwrap(); assert_eq!(json_out, "42"); } #[test] fn test_unpack_only_string() { setup_shm(); let schema = parse_schema("s").unwrap(); // msgpack for "hi" = [0xa2, 0x68, 0x69] let mpk = vec![0xa2, 0x68, 0x69]; let size = calc_unpack_size(&mpk, &schema).unwrap(); eprintln!("unpack size for string: {} (Array={}, total={})", size, std::mem::size_of::(), size); let ptr = unpack_with_schema(&mpk, &schema).unwrap(); let json_out = json::voidstar_to_json_string(ptr, &schema).unwrap(); assert_eq!(json_out, "\"hi\""); } } ================================================ FILE: data/rust/morloc-runtime/src/packet.rs ================================================ use crate::error::MorlocError; // ── Magic & version constants ────────────────────────────────────────────── pub const PACKET_MAGIC: u32 = 0x0707_f86d; pub const THIS_PLAIN: u16 = 0; pub const THIS_VERSION: u16 = 0; pub const DEFAULT_FLAVOR: u16 = 0; pub const DEFAULT_MODE: u16 = 0; // ── Command type discriminants ───────────────────────────────────────────── pub const PACKET_TYPE_DATA: u8 = 0; pub const PACKET_TYPE_CALL: u8 = 1; pub const PACKET_TYPE_PING: u8 = 2; // ── Data source ──────────────────────────────────────────────────────────── pub const PACKET_SOURCE_MESG: u8 = 0x00; pub const PACKET_SOURCE_FILE: u8 = 0x01; pub const PACKET_SOURCE_RPTR: u8 = 0x02; // ── Data format ──────────────────────────────────────────────────────────── pub const PACKET_FORMAT_JSON: u8 = 0x00; pub const 
PACKET_FORMAT_MSGPACK: u8 = 0x01; pub const PACKET_FORMAT_TEXT: u8 = 0x02; pub const PACKET_FORMAT_DATA: u8 = 0x03; pub const PACKET_FORMAT_VOIDSTAR: u8 = 0x04; pub const PACKET_FORMAT_ARROW: u8 = 0x05; // ── Compression / encryption ─────────────────────────────────────────────── pub const PACKET_COMPRESSION_NONE: u8 = 0x00; pub const PACKET_ENCRYPTION_NONE: u8 = 0x00; // ── Status ───────────────────────────────────────────────────────────────── pub const PACKET_STATUS_PASS: u8 = 0x00; pub const PACKET_STATUS_FAIL: u8 = 0x01; // ── Entrypoint ────────────────────���──────────────────────────────────────── pub const PACKET_ENTRYPOINT_LOCAL: u8 = 0x00; pub const PACKET_ENTRYPOINT_REMOTE_SFS: u8 = 0x01; // ── Inline threshold ─────────────────────────────────────��───────────────── pub const MORLOC_INLINE_THRESHOLD: usize = 64 * 1024; // ── Metadata ─────────��───────────────────────────────────────────────────── pub const METADATA_TYPE_SCHEMA_STRING: u8 = 0x01; pub const METADATA_TYPE_XXHASH: u8 = 0x02; pub const METADATA_HEADER_MAGIC: [u8; 3] = *b"mmh"; // ── Packed structs matching the C binary layout ────���─────────────────────── /// 8-byte command union. We represent each variant as its own struct and /// transmute at the boundary. #[derive(Debug, Clone, Copy)] #[repr(C, packed)] pub struct CommandType { pub cmd_type: u8, pub padding: [u8; 7], } #[derive(Debug, Clone, Copy)] #[repr(C, packed)] pub struct CommandCall { pub cmd_type: u8, pub entrypoint: u8, pub padding: [u8; 2], pub midx: u32, } #[derive(Debug, Clone, Copy)] #[repr(C, packed)] pub struct CommandData { pub cmd_type: u8, pub source: u8, pub format: u8, pub compression: u8, pub encryption: u8, pub status: u8, pub padding: [u8; 2], } #[derive(Debug, Clone, Copy)] #[repr(C, packed)] pub struct CommandPing { pub cmd_type: u8, pub padding: [u8; 7], } /// The 8-byte command field stored as raw bytes. Interpreted based on the /// first byte (cmd_type discriminant). 
#[derive(Clone, Copy)] #[repr(C, packed)] pub union PacketCommand { pub cmd_type: CommandType, pub call: CommandCall, pub data: CommandData, pub ping: CommandPing, pub raw: [u8; 8], } impl std::fmt::Debug for PacketCommand { fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result { let tag = unsafe { self.cmd_type.cmd_type }; match tag { PACKET_TYPE_DATA => write!(f, "Command::Data({:?})", unsafe { self.data }), PACKET_TYPE_CALL => write!(f, "Command::Call({:?})", unsafe { self.call }), PACKET_TYPE_PING => write!(f, "Command::Ping"), _ => write!(f, "Command::Unknown({tag})"), } } } /// 32-byte packet header. Must match morloc_packet_header_t exactly. #[derive(Debug, Clone, Copy)] #[repr(C, packed)] pub struct PacketHeader { pub magic: u32, pub plain: u16, pub version: u16, pub flavor: u16, pub mode: u16, pub command: PacketCommand, pub offset: u32, pub length: u64, } const _: () = assert!(std::mem::size_of::() == 32); const _: () = assert!(std::mem::size_of::() == 8); const _: () = assert!(std::mem::size_of::() == 8); const _: () = assert!(std::mem::size_of::() == 8); /// 8-byte metadata header. #[derive(Debug, Clone, Copy)] #[repr(C, packed)] pub struct MetadataHeader { pub magic: [u8; 3], pub metadata_type: u8, pub size: u32, } const _: () = assert!(std::mem::size_of::() == 8); // ── Packet construction helpers ──────────────────────────────────────────── impl PacketHeader { fn new(command: PacketCommand, offset: u32, length: u64) -> Self { PacketHeader { magic: PACKET_MAGIC, plain: THIS_PLAIN, version: THIS_VERSION, flavor: DEFAULT_FLAVOR, mode: DEFAULT_MODE, command, offset, length, } } /// Create a ping packet (no payload). pub fn ping() -> Self { Self::new( PacketCommand { ping: CommandPing { cmd_type: PACKET_TYPE_PING, padding: [0; 7], }, }, 0, // no metadata 0, // no payload ) } /// Create a local call packet header. 
    pub fn local_call(midx: u32, payload_len: u64) -> Self {
        Self::new(
            PacketCommand {
                call: CommandCall {
                    cmd_type: PACKET_TYPE_CALL,
                    entrypoint: PACKET_ENTRYPOINT_LOCAL,
                    padding: [0; 2],
                    midx,
                },
            },
            0, // no metadata between header and arg packets
            payload_len,
        )
    }

    /// Create a remote call packet header.
    pub fn remote_call(midx: u32, payload_len: u64) -> Self {
        Self::new(
            PacketCommand {
                call: CommandCall {
                    cmd_type: PACKET_TYPE_CALL,
                    entrypoint: PACKET_ENTRYPOINT_REMOTE_SFS,
                    padding: [0; 2],
                    midx,
                },
            },
            0,
            payload_len,
        )
    }

    /// Create a data packet header for inline message data.
    ///
    /// `format` is one of the PACKET_FORMAT_* constants.
    pub fn data_mesg(format: u8, payload_len: u64) -> Self {
        Self::new(
            PacketCommand {
                data: CommandData {
                    cmd_type: PACKET_TYPE_DATA,
                    source: PACKET_SOURCE_MESG,
                    format,
                    compression: PACKET_COMPRESSION_NONE,
                    encryption: PACKET_ENCRYPTION_NONE,
                    status: PACKET_STATUS_PASS,
                    padding: [0; 2],
                },
            },
            0, // metadata size set separately when building full packet
            payload_len,
        )
    }

    /// Create a data packet header for relative pointer (shared memory).
    pub fn data_rptr(format: u8, payload_len: u64) -> Self {
        Self::new(
            PacketCommand {
                data: CommandData {
                    cmd_type: PACKET_TYPE_DATA,
                    source: PACKET_SOURCE_RPTR,
                    format,
                    compression: PACKET_COMPRESSION_NONE,
                    encryption: PACKET_ENCRYPTION_NONE,
                    status: PACKET_STATUS_PASS,
                    padding: [0; 2],
                },
            },
            0, // metadata size set separately when building full packet
            payload_len,
        )
    }

    /// Create a fail packet with an error message.
    ///
    /// A failure is a TEXT-format data packet whose status byte is
    /// PACKET_STATUS_FAIL; the message bytes form the payload.
    pub fn fail(error_msg_len: u64) -> Self {
        Self::new(
            PacketCommand {
                data: CommandData {
                    cmd_type: PACKET_TYPE_DATA,
                    source: PACKET_SOURCE_MESG,
                    format: PACKET_FORMAT_TEXT,
                    compression: PACKET_COMPRESSION_NONE,
                    encryption: PACKET_ENCRYPTION_NONE,
                    status: PACKET_STATUS_FAIL,
                    padding: [0; 2],
                },
            },
            0,
            error_msg_len,
        )
    }

    /// Total packet size (header + payload).
    pub fn total_size(&self) -> u64 {
        self.offset as u64 + self.length
    }

    /// Check if this is a valid morloc packet.
    pub fn is_valid(&self) -> bool {
        self.magic == PACKET_MAGIC
    }

    /// Get the command type.
    pub fn command_type(&self) -> u8 {
        // SAFETY: every variant of the 8-byte command union stores the
        // discriminant in its first byte, so reading through `cmd_type` is valid.
        unsafe { self.command.cmd_type.cmd_type }
    }

    pub fn is_ping(&self) -> bool {
        self.command_type() == PACKET_TYPE_PING
    }

    pub fn is_call(&self) -> bool {
        self.command_type() == PACKET_TYPE_CALL
    }

    pub fn is_data(&self) -> bool {
        self.command_type() == PACKET_TYPE_DATA
    }

    pub fn is_local_call(&self) -> bool {
        // SAFETY: only read the call variant after confirming the discriminant.
        self.is_call() && unsafe { self.command.call.entrypoint } == PACKET_ENTRYPOINT_LOCAL
    }

    pub fn is_remote_call(&self) -> bool {
        self.is_call() && unsafe { self.command.call.entrypoint } == PACKET_ENTRYPOINT_REMOTE_SFS
    }

    pub fn is_fail(&self) -> bool {
        self.is_data() && unsafe { self.command.data.status } == PACKET_STATUS_FAIL
    }

    /// Serialize the header to bytes.
    pub fn to_bytes(&self) -> [u8; 32] {
        // SAFETY: PacketHeader is repr(C, packed) and exactly 32 bytes
        // (enforced by a compile-time assert), so a byte transmute is valid.
        unsafe { std::mem::transmute(*self) }
    }

    /// Deserialize a header from bytes.
    ///
    /// Fails when the magic number does not match PACKET_MAGIC.
    pub fn from_bytes(bytes: &[u8; 32]) -> Result<Self, MorlocError> {
        let header: PacketHeader = unsafe { std::mem::transmute(*bytes) };
        if !header.is_valid() {
            // Copy the packed field to a local before formatting
            // (taking a reference into a packed struct is UB).
            let magic = { header.magic };
            return Err(MorlocError::Packet(format!(
                "invalid magic: 0x{magic:08x}"
            )));
        }
        Ok(header)
    }
}

// ── Full packet construction (header + metadata + payload) ─────────────────

/// Build a complete data packet with schema metadata and relptr payload.
pub fn make_standard_data_packet(relptr: crate::shm::RelPtr, schema: &crate::Schema) -> Vec { let schema_str = crate::schema::schema_to_string(schema); let schema_bytes = schema_str.as_bytes(); let schema_len = schema_bytes.len() + 1; // +1 for null terminator // Metadata: header (8 bytes) + schema string (null-terminated), padded to 32-byte boundary let meta_header_size = std::mem::size_of::(); let raw_meta_len = meta_header_size + schema_len; let padded_meta_len = ((raw_meta_len + 31) / 32) * 32; // Payload: relptr let payload_len = std::mem::size_of::(); let total = 32 + padded_meta_len + payload_len; let mut packet = vec![0u8; total]; // Write header let header = PacketHeader::data_rptr(PACKET_FORMAT_VOIDSTAR, payload_len as u64); let mut hdr = header; // Override offset to include metadata unsafe { let hdr_ptr = &mut hdr as *mut PacketHeader as *mut u8; // Set offset field (at byte 20 in packed struct) let offset_ptr = hdr_ptr.add(20) as *mut u32; *offset_ptr = padded_meta_len as u32; } let hdr_bytes = hdr.to_bytes(); packet[..32].copy_from_slice(&hdr_bytes); // Write metadata header let meta_start = 32; packet[meta_start] = b'm'; packet[meta_start + 1] = b'm'; packet[meta_start + 2] = b'h'; packet[meta_start + 3] = METADATA_TYPE_SCHEMA_STRING; let meta_size_bytes = (schema_len as u32).to_le_bytes(); packet[meta_start + 4..meta_start + 8].copy_from_slice(&meta_size_bytes); // Write schema string (null-terminated) let schema_data_start = meta_start + meta_header_size; packet[schema_data_start..schema_data_start + schema_bytes.len()].copy_from_slice(schema_bytes); // Null terminator already there from vec![0u8] // Write relptr payload let payload_start = 32 + padded_meta_len; let relptr_bytes = relptr.to_ne_bytes(); packet[payload_start..payload_start + relptr_bytes.len()].copy_from_slice(&relptr_bytes); packet } /// Build an inline MESG+MSGPACK data packet with schema metadata. 
pub fn make_mesg_data_packet(mpk_data: &[u8], schema: &crate::Schema) -> Vec { let schema_str = crate::schema::schema_to_string(schema); let schema_bytes = schema_str.as_bytes(); let schema_len = schema_bytes.len() + 1; // +1 for null terminator let meta_header_size = std::mem::size_of::(); let raw_meta_len = meta_header_size + schema_len; let padded_meta_len = ((raw_meta_len + 31) / 32) * 32; let total = 32 + padded_meta_len + mpk_data.len(); let mut packet = vec![0u8; total]; // Write header let mut header = PacketHeader::data_mesg(PACKET_FORMAT_MSGPACK, mpk_data.len() as u64); // Set offset to metadata size unsafe { let hdr_ptr = &mut header as *mut PacketHeader as *mut u8; let offset_ptr = hdr_ptr.add(20) as *mut u32; *offset_ptr = padded_meta_len as u32; } let hdr_bytes = header.to_bytes(); packet[..32].copy_from_slice(&hdr_bytes); // Write metadata header let meta_start = 32; packet[meta_start] = b'm'; packet[meta_start + 1] = b'm'; packet[meta_start + 2] = b'h'; packet[meta_start + 3] = METADATA_TYPE_SCHEMA_STRING; let meta_size_bytes = (schema_len as u32).to_le_bytes(); packet[meta_start + 4..meta_start + 8].copy_from_slice(&meta_size_bytes); // Write schema string let schema_data_start = meta_start + meta_header_size; packet[schema_data_start..schema_data_start + schema_bytes.len()].copy_from_slice(schema_bytes); // Write msgpack payload let payload_start = 32 + padded_meta_len; packet[payload_start..payload_start + mpk_data.len()].copy_from_slice(mpk_data); packet } /// Build a call packet from argument data packets. 
/// The payload is the argument packets concatenated back to back; `midx`
/// identifies the manifest entry to invoke.
pub fn make_local_call_packet(midx: u32, arg_packets: &[Vec<u8>]) -> Vec<u8> {
    // Total payload length is the sum of all argument packet sizes.
    let data_length: usize = arg_packets.iter().map(|p| p.len()).sum();
    let total = 32 + data_length;
    let mut packet = vec![0u8; total];
    // Write call header
    let header = PacketHeader::local_call(midx, data_length as u64);
    let hdr_bytes = header.to_bytes();
    packet[..32].copy_from_slice(&hdr_bytes);
    // Concatenate argument packets
    let mut pos = 32;
    for arg in arg_packets {
        packet[pos..pos + arg.len()].copy_from_slice(arg);
        pos += arg.len();
    }
    packet
}

/// Build a fail packet with an error message string.
///
/// The UTF-8 message bytes follow the 32-byte header directly (no metadata).
pub fn make_fail_packet_bytes(error_msg: &str) -> Vec<u8> {
    let msg_bytes = error_msg.as_bytes();
    let total = 32 + msg_bytes.len();
    let mut packet = vec![0u8; total];
    let header = PacketHeader::fail(msg_bytes.len() as u64);
    let hdr_bytes = header.to_bytes();
    packet[..32].copy_from_slice(&hdr_bytes);
    packet[32..].copy_from_slice(msg_bytes);
    packet
}

/// Extract the payload from a data packet (bytes after header + metadata offset).
///
/// Errors if the buffer is shorter than a header, the magic is wrong, or the
/// declared payload extends past the end of the buffer.
pub fn get_data_payload(packet: &[u8]) -> Result<&[u8], MorlocError> {
    if packet.len() < 32 {
        return Err(MorlocError::Packet("packet too small".into()));
    }
    let header = PacketHeader::from_bytes(packet[..32].try_into().unwrap())?;
    // Copy packed fields by value before use (references into packed structs are UB).
    let offset = { header.offset } as usize;
    let length = { header.length } as usize;
    let start = 32 + offset;
    let end = start + length;
    if end > packet.len() {
        return Err(MorlocError::Packet("payload extends past packet end".into()));
    }
    Ok(&packet[start..end])
}

/// Extract error message from a fail packet.
///
/// Returns Ok(None) when the packet is valid but not a failure packet.
pub fn get_error_message(packet: &[u8]) -> Result<Option<String>, MorlocError> {
    if packet.len() < 32 {
        return Err(MorlocError::Packet("packet too small".into()));
    }
    let header = PacketHeader::from_bytes(packet[..32].try_into().unwrap())?;
    if !header.is_fail() {
        return Ok(None);
    }
    let payload = get_data_payload(packet)?;
    // The message may not be valid UTF-8; degrade gracefully with lossy decoding.
    Ok(Some(String::from_utf8_lossy(payload).into_owned()))
}

/// Read the schema string from packet metadata section.
/// Scans the metadata region (between the header and the payload) for an
/// "mmh" entry of type METADATA_TYPE_SCHEMA_STRING and returns its
/// null-terminated string. Returns Ok(None) when no schema entry is present.
pub fn read_schema_from_meta(packet: &[u8]) -> Result<Option<String>, MorlocError> {
    if packet.len() < 32 {
        return Err(MorlocError::Packet("packet too small".into()));
    }
    let header = PacketHeader::from_bytes(packet[..32].try_into().unwrap())?;
    // Copy packed field by value (references into packed structs are UB).
    let offset = { header.offset } as usize;
    if offset == 0 {
        // offset == 0 means there is no metadata section at all.
        return Ok(None);
    }
    // Scan metadata headers
    let meta_start = 32;
    let meta_end = meta_start + offset;
    let mut pos = meta_start;
    while pos + 8 <= meta_end {
        if packet[pos] == b'm' && packet[pos + 1] == b'm' && packet[pos + 2] == b'h' {
            let meta_type = packet[pos + 3];
            let meta_size = u32::from_le_bytes([
                packet[pos + 4],
                packet[pos + 5],
                packet[pos + 6],
                packet[pos + 7],
            ]) as usize;
            if meta_type == METADATA_TYPE_SCHEMA_STRING {
                let str_start = pos + 8;
                let str_end = str_start + meta_size;
                if str_end <= meta_end {
                    let bytes = &packet[str_start..str_end];
                    // Find null terminator
                    let len = bytes.iter().position(|&b| b == 0).unwrap_or(bytes.len());
                    return Ok(Some(String::from_utf8_lossy(&bytes[..len]).into_owned()));
                }
            }
            pos += 8 + meta_size;
        } else {
            // Padding (zero bytes) or unknown content: stop scanning.
            break;
        }
    }
    Ok(None)
}

/// Get the voidstar value from a data packet (resolves relptr to absptr).
pub fn get_data_value( packet: &[u8], schema: &crate::Schema, ) -> Result { let header = PacketHeader::from_bytes(packet[..32].try_into().unwrap())?; let source = unsafe { header.command.data.source }; let format = unsafe { header.command.data.format }; let payload = get_data_payload(packet)?; match source { PACKET_SOURCE_RPTR => { // Payload is a relptr if payload.len() < std::mem::size_of::() { return Err(MorlocError::Packet("relptr payload too small".into())); } let relptr = crate::shm::RelPtr::from_ne_bytes( payload[..std::mem::size_of::()].try_into().unwrap() ); crate::shm::rel2abs(relptr) } PACKET_SOURCE_MESG => { match format { PACKET_FORMAT_MSGPACK => { crate::mpack::unpack_with_schema(payload, schema) } PACKET_FORMAT_JSON => { let json_str = std::str::from_utf8(payload) .map_err(|e| MorlocError::Packet(format!("invalid UTF-8: {}", e)))?; crate::json::read_json_with_schema(json_str, schema) } PACKET_FORMAT_VOIDSTAR => { read_voidstar_binary(payload, schema) } _ => { Err(MorlocError::Packet(format!( "unsupported data format: {}", format ))) } } } _ => Err(MorlocError::Packet(format!("unsupported source: {}", source))), } } // ── Inline voidstar deserialization ───────────────────────────────────────── /// Read a flat voidstar binary blob into shared memory, adjusting relptrs. fn read_voidstar_binary( blob: &[u8], schema: &crate::Schema, ) -> Result { use crate::shm; let base = shm::shmalloc(blob.len())?; unsafe { std::ptr::copy_nonoverlapping(blob.as_ptr(), base, blob.len()) }; let base_rel = shm::abs2rel(base)?; adjust_voidstar_relptrs(base, schema, base_rel)?; Ok(base) } /// Adjust relptrs in a voidstar blob that was copied into SHM. /// The blob's internal relptrs are offsets from position 0 of the blob. /// Adding `base_rel` converts them to valid SHM relptrs. 
fn adjust_voidstar_relptrs(
    data: crate::shm::AbsPtr,
    schema: &crate::Schema,
    base_rel: crate::shm::RelPtr,
) -> Result<(), MorlocError> {
    use crate::schema::SerialType;
    use crate::shm::{self, Array, Tensor};
    // Walk the value according to its schema, shifting every embedded relptr
    // by base_rel so offsets that were relative to blob position 0 become
    // valid SHM-relative pointers.
    unsafe {
        match schema.serial_type {
            SerialType::String | SerialType::Array => {
                // Strings share the Array layout: a relptr to the element buffer.
                let arr = &mut *(data as *mut Array);
                arr.data += base_rel;
                // Recurse into elements if variable-width (strings are always fixed-width bytes)
                if !schema.parameters.is_empty() && !schema.parameters[0].is_fixed_width() {
                    let arr_data = shm::rel2abs(arr.data)?;
                    let elem_width = schema.parameters[0].width;
                    for i in 0..arr.size {
                        let elem = arr_data.add(i * elem_width);
                        adjust_voidstar_relptrs(elem, &schema.parameters[0], base_rel)?;
                    }
                }
            }
            SerialType::Tuple | SerialType::Map => {
                // Fixed layout: visit each field at its schema-recorded offset.
                for i in 0..schema.parameters.len() {
                    let child = data.add(schema.offsets[i]);
                    adjust_voidstar_relptrs(child, &schema.parameters[i], base_rel)?;
                }
            }
            SerialType::Optional => {
                // First byte is the presence tag; only recurse when present.
                let tag = *data;
                if tag != 0 {
                    // Fall back to computing the inner offset from alignment when
                    // the schema did not record one.
                    let inner_offset = schema.offsets.first().copied().unwrap_or(
                        shm::align_up(1, schema.parameters[0].alignment().max(1)),
                    );
                    let child = data.add(inner_offset);
                    adjust_voidstar_relptrs(child, &schema.parameters[0], base_rel)?;
                }
            }
            SerialType::Tensor => {
                let tensor = &mut *(data as *mut Tensor);
                // Empty tensors carry no buffers worth adjusting.
                if tensor.total_elements > 0 {
                    tensor.shape += base_rel;
                    tensor.data += base_rel;
                }
            }
            _ => {} // Fixed-width primitives: no relptrs to adjust
        }
    }
    Ok(())
}

#[cfg(test)]
mod tests {
    use super::*;

    #[test]
    fn test_header_size() {
        // NOTE(review): the generic argument was lost in extraction; this
        // presumably asserts size_of::<PacketHeader>() == 32 — confirm against
        // the repository copy.
        assert_eq!(std::mem::size_of::(), 32);
    }

    #[test]
    fn test_ping_roundtrip() {
        let ping = PacketHeader::ping();
        assert!(ping.is_valid());
        assert!(ping.is_ping());
        let bytes = ping.to_bytes();
        let recovered = PacketHeader::from_bytes(&bytes).unwrap();
        assert!(recovered.is_ping());
    }

    #[test]
    fn test_call_packet() {
        let call = PacketHeader::local_call(42, 128);
        assert!(call.is_call());
        assert!(call.is_local_call());
        assert!(!call.is_remote_call());
        let bytes = call.to_bytes();
        let recovered = PacketHeader::from_bytes(&bytes).unwrap();
        assert!(recovered.is_local_call());
        // Union/packed fields are copied out before asserting.
        let midx = unsafe { recovered.command.call.midx };
        assert_eq!(midx, 42);
        let len = { recovered.length };
        assert_eq!(len, 128);
    }

    #[test]
    fn test_fail_packet() {
        let fail = PacketHeader::fail(100);
        assert!(fail.is_data());
        assert!(fail.is_fail());
    }

    #[test]
    fn test_data_mesg() {
        let data = PacketHeader::data_mesg(PACKET_FORMAT_MSGPACK, 256);
        assert!(data.is_data());
        assert!(!data.is_fail());
        let fmt = unsafe { data.command.data.format };
        assert_eq!(fmt, PACKET_FORMAT_MSGPACK);
        let len = { data.length };
        assert_eq!(len, 256);
    }
}


================================================
FILE: data/rust/morloc-runtime/src/packet_ffi.rs
================================================
//! C ABI wrappers for packet functions.
//! Replaces packet.c with calls to Rust packet.rs + voidstar.rs.

use std::ffi::{c_char, c_void, CStr};
use std::ptr;

use crate::cschema::CSchema;
use crate::error::{clear_errmsg, set_errmsg, MorlocError};
use crate::packet::*;
use crate::shm::{self, AbsPtr, RelPtr};

// ── morloc_call_t ────────────────────────────────────────────────────────────

/// Matches C `morloc_call_t` layout.
#[repr(C)] pub struct MorlocCall { pub midx: u32, pub args: *mut *mut u8, pub nargs: usize, pub owns_args: i32, } // ── Header reading ─────────────────────────────────────────────────────────── #[no_mangle] pub unsafe extern "C" fn read_morloc_packet_header( msg: *const u8, errmsg: *mut *mut c_char, ) -> *mut PacketHeader { clear_errmsg(errmsg); if msg.is_null() { set_errmsg(errmsg, &MorlocError::Packet("Cannot make packet from NULL pointer".into())); return ptr::null_mut(); } // Validate magic let header = &*(msg as *const PacketHeader); if !header.is_valid() { set_errmsg(errmsg, &MorlocError::Packet("Malformed morloc packet".into())); return ptr::null_mut(); } msg as *mut PacketHeader } #[no_mangle] pub unsafe extern "C" fn packet_is_ping( packet: *const u8, errmsg: *mut *mut c_char, ) -> bool { clear_errmsg(errmsg); let header = read_morloc_packet_header(packet, errmsg); if header.is_null() { return false; } (*header).is_ping() } #[no_mangle] pub unsafe extern "C" fn packet_is_local_call( packet: *const u8, errmsg: *mut *mut c_char, ) -> bool { clear_errmsg(errmsg); let header = read_morloc_packet_header(packet, errmsg); if header.is_null() { return false; } (*header).is_local_call() } #[no_mangle] pub unsafe extern "C" fn packet_is_remote_call( packet: *const u8, errmsg: *mut *mut c_char, ) -> bool { clear_errmsg(errmsg); let header = read_morloc_packet_header(packet, errmsg); if header.is_null() { return false; } (*header).is_remote_call() } // ── Packet size ────────────────────────────────────────────────────────────── #[no_mangle] pub unsafe extern "C" fn morloc_packet_size_from_header( header: *const PacketHeader, ) -> usize { if header.is_null() { return 0; } 32 + (*header).offset as usize + (*header).length as usize } #[no_mangle] pub unsafe extern "C" fn morloc_packet_size( packet: *const u8, errmsg: *mut *mut c_char, ) -> usize { clear_errmsg(errmsg); let header = read_morloc_packet_header(packet, errmsg); if header.is_null() { return 0; } 
morloc_packet_size_from_header(header) } // ── Ping ───────────────────────────────────────────────────────────────────── #[no_mangle] pub unsafe extern "C" fn return_ping( packet: *const u8, errmsg: *mut *mut c_char, ) -> *mut u8 { clear_errmsg(errmsg); if !packet_is_ping(packet, errmsg) { if (*errmsg).is_null() { set_errmsg(errmsg, &MorlocError::Packet("Not a ping packet".into())); } return ptr::null_mut(); } let size = morloc_packet_size(packet, errmsg); if size == 0 { return ptr::null_mut(); } let buf = libc::calloc(size, 1) as *mut u8; if buf.is_null() { set_errmsg(errmsg, &MorlocError::Packet("Failed to allocate ping response".into())); return ptr::null_mut(); } ptr::copy_nonoverlapping(packet, buf, size); buf } #[no_mangle] pub extern "C" fn make_ping_packet() -> *mut u8 { // SAFETY: calloc returns null or a valid pointer to 32 zeroed bytes. let buf = unsafe { libc::calloc(32, 1) as *mut u8 }; if buf.is_null() { return ptr::null_mut(); } let header = PacketHeader::ping(); let bytes = header.to_bytes(); // SAFETY: buf points to 32 bytes; bytes is exactly 32 bytes from to_bytes(). unsafe { ptr::copy_nonoverlapping(bytes.as_ptr(), buf, 32) }; buf } // ── Data packet construction helpers ───────────────────────────────────────── /// Build metadata section: metadata header + schema string, padded to 32-byte boundary. /// Returns (metadata_buffer, padded_length). Returns (null, 0) if schema is null. /// /// # Safety /// `schema` must be null or a valid CSchema pointer. 
unsafe fn build_schema_metadata(schema: *const CSchema) -> (*mut u8, usize) { if schema.is_null() { return (ptr::null_mut(), 0); } let rs = CSchema::to_rust(schema); let schema_str = crate::schema::schema_to_string(&rs); let schema_bytes = schema_str.as_bytes(); let schema_len = schema_bytes.len() + 1; // +1 for null terminator let meta_header_size = 8; // sizeof(morloc_metadata_header_t) let raw_meta_len = meta_header_size + schema_len; let padded_meta_len = ((raw_meta_len + 31) / 32) * 32; let metadata = libc::calloc(padded_meta_len, 1) as *mut u8; if metadata.is_null() { return (ptr::null_mut(), 0); } // Write metadata header *metadata = b'm'; *metadata.add(1) = b'm'; *metadata.add(2) = b'h'; *metadata.add(3) = METADATA_TYPE_SCHEMA_STRING; *(metadata.add(4) as *mut u32) = schema_len as u32; // Write schema string ptr::copy_nonoverlapping(schema_bytes.as_ptr(), metadata.add(meta_header_size), schema_bytes.len()); // Null terminator already zeroed by calloc (metadata, padded_meta_len) } /// Generic data packet builder matching C's make_morloc_data_packet. /// /// # Safety /// If non-null, `data` must point to `data_length` readable bytes. /// If non-null, `metadata` must point to `metadata_length` readable bytes. 
unsafe fn make_data_packet_raw( data: *const u8, data_length: usize, metadata: *const u8, metadata_length: usize, src: u8, fmt: u8, cmpr: u8, encr: u8, status: u8, ) -> *mut u8 { let total = 32 + metadata_length + data_length; let packet = libc::calloc(total, 1) as *mut u8; if packet.is_null() { return ptr::null_mut(); } // Build command let cmd = CommandData { cmd_type: PACKET_TYPE_DATA, source: src, format: fmt, compression: cmpr, encryption: encr, status, padding: [0; 2], }; let header = PacketHeader { magic: PACKET_MAGIC, plain: THIS_PLAIN, version: THIS_VERSION, flavor: DEFAULT_FLAVOR, mode: DEFAULT_MODE, command: PacketCommand { data: cmd }, offset: metadata_length as u32, length: data_length as u64, }; let hdr_bytes = header.to_bytes(); ptr::copy_nonoverlapping(hdr_bytes.as_ptr(), packet, 32); if !metadata.is_null() && metadata_length > 0 { ptr::copy_nonoverlapping(metadata, packet.add(32), metadata_length); } if !data.is_null() && data_length > 0 { ptr::copy_nonoverlapping(data, packet.add(32 + metadata_length), data_length); } packet } /// Generic data packet with schema metadata. 
unsafe fn make_data_packet_with_schema(
    data: *const u8,
    data_length: usize,
    schema: *const CSchema,
    src: u8,
    fmt: u8,
    cmpr: u8,
    encr: u8,
    status: u8,
) -> *mut u8 {
    // Build the (possibly empty) schema metadata section, emit the packet,
    // then release the temporary metadata buffer.
    let (metadata, metadata_length) = build_schema_metadata(schema);
    let result = make_data_packet_raw(
        data, data_length,
        metadata, metadata_length,
        src, fmt, cmpr, encr, status,
    );
    if !metadata.is_null() {
        libc::free(metadata as *mut c_void);
    }
    result
}

// ── Standard data packet (RPTR + VOIDSTAR) ──────────────────────────────────

#[no_mangle]
pub unsafe extern "C" fn make_standard_data_packet(
    relptr: RelPtr,
    schema: *const CSchema,
) -> *mut u8 {
    // Payload is a single relptr; allocate space for it but fill it afterward.
    // NOTE(review): the generic argument of size_of below was lost in
    // extraction — presumably size_of::<RelPtr>(); confirm against the repo.
    let packet = make_data_packet_with_schema(
        ptr::null(), std::mem::size_of::(), schema,
        PACKET_SOURCE_RPTR, PACKET_FORMAT_VOIDSTAR,
        PACKET_COMPRESSION_NONE, PACKET_ENCRYPTION_NONE, PACKET_STATUS_PASS,
    );
    if packet.is_null() {
        return ptr::null_mut();
    }
    // Write the relptr into the payload area
    let header = &*(packet as *const PacketHeader);
    let payload_offset = 32 + header.offset as usize;
    *(packet.add(payload_offset) as *mut RelPtr) = relptr;
    packet
}

#[no_mangle]
pub unsafe extern "C" fn make_arrow_data_packet(
    relptr: RelPtr,
    schema: *const CSchema,
) -> *mut u8 {
    // Same shape as make_standard_data_packet but tagged as Arrow format.
    let packet = make_data_packet_with_schema(
        ptr::null(), std::mem::size_of::(), schema,
        PACKET_SOURCE_RPTR, PACKET_FORMAT_ARROW,
        PACKET_COMPRESSION_NONE, PACKET_ENCRYPTION_NONE, PACKET_STATUS_PASS,
    );
    if packet.is_null() {
        return ptr::null_mut();
    }
    let header = &*(packet as *const PacketHeader);
    let payload_offset = 32 + header.offset as usize;
    *(packet.add(payload_offset) as *mut RelPtr) = relptr;
    packet
}

// ── Msgpack packets ──────────────────────────────────────────────────────────

#[no_mangle]
pub unsafe extern "C" fn make_mpk_data_packet(
    mpk_filename: *const c_char,
    schema: *const CSchema,
) -> *mut u8 {
    // FILE-sourced packet: the payload is the filename, not the data itself.
    if mpk_filename.is_null() {
        return ptr::null_mut();
    }
    let filename = CStr::from_ptr(mpk_filename);
    let bytes = filename.to_bytes();
    make_data_packet_with_schema(
        bytes.as_ptr(), bytes.len(), schema,
        PACKET_SOURCE_FILE, PACKET_FORMAT_MSGPACK,
        PACKET_COMPRESSION_NONE, PACKET_ENCRYPTION_NONE, PACKET_STATUS_PASS,
    )
}

#[no_mangle]
pub unsafe extern "C" fn make_data_packet_from_mpk(
    mpk: *const c_char,
    mpk_size: usize,
    schema: *const CSchema,
) -> *mut u8 {
    // MESG-sourced packet: the msgpack bytes are embedded inline.
    make_data_packet_with_schema(
        mpk as *const u8, mpk_size, schema,
        PACKET_SOURCE_MESG, PACKET_FORMAT_MSGPACK,
        PACKET_COMPRESSION_NONE, PACKET_ENCRYPTION_NONE, PACKET_STATUS_PASS,
    )
}

// ── get_data_packet_as_mpk ───────────────────────────────────────────────────

// Convert any supported data packet into a malloc'd msgpack buffer.
// Returns 1 on success, 0 on failure (errmsg set).
// NOTE(review): `mpk_out`, `mpk_size_out` are dereferenced without null
// checks — callers must always pass valid out-pointers.
#[no_mangle]
pub unsafe extern "C" fn get_data_packet_as_mpk(
    packet: *const u8,
    schema: *const CSchema,
    mpk_out: *mut *mut c_char,
    mpk_size_out: *mut usize,
    errmsg: *mut *mut c_char,
) -> i32 {
    clear_errmsg(errmsg);
    *mpk_out = ptr::null_mut();
    *mpk_size_out = 0;
    let header = read_morloc_packet_header(packet, errmsg);
    if header.is_null() {
        return 0;
    }
    if (*header).command_type() != PACKET_TYPE_DATA {
        set_errmsg(errmsg, &MorlocError::Packet("Expected a data packet".into()));
        return 0;
    }
    // Check for error
    if (*header).is_fail() {
        let payload_start = 32 + (*header).offset as usize;
        let payload_len = (*header).length as usize;
        // NOTE(review): from_utf8_unchecked is UB if the fail payload is not
        // valid UTF-8 — consider from_utf8_lossy here.
        let msg = std::str::from_utf8_unchecked(
            std::slice::from_raw_parts(packet.add(payload_start), payload_len)
        );
        set_errmsg(errmsg, &MorlocError::Packet(format!("\n{}", msg)));
        return 0;
    }
    let rs = CSchema::to_rust(schema);
    let source = (*header).command.data.source;
    let format = (*header).command.data.format;
    let payload_start = 32 + (*header).offset as usize;
    let payload_len = (*header).length as usize;
    let payload = std::slice::from_raw_parts(packet.add(payload_start), payload_len);
    if source == PACKET_SOURCE_MESG && format == PACKET_FORMAT_MSGPACK {
        // Inline msgpack: copy directly
        let buf = libc::malloc(payload_len) as *mut c_char;
        if buf.is_null() {
            set_errmsg(errmsg, &MorlocError::Packet("malloc failed".into()));
            return 0;
        }
        ptr::copy_nonoverlapping(payload.as_ptr(), buf as *mut u8, payload_len);
        *mpk_out = buf;
        *mpk_size_out = payload_len;
    } else if source == PACKET_SOURCE_MESG && format == PACKET_FORMAT_VOIDSTAR {
        // Inline voidstar: load into SHM then convert to msgpack
        match crate::voidstar::read_binary(payload, &rs) {
            Ok(abs) => {
                match crate::mpack::pack_with_schema(abs, &rs) {
                    Ok(data) => {
                        let buf = libc::malloc(data.len()) as *mut u8;
                        if buf.is_null() {
                            set_errmsg(errmsg, &MorlocError::Packet("malloc failed".into()));
                            return 0;
                        }
                        ptr::copy_nonoverlapping(data.as_ptr(), buf, data.len());
                        *mpk_out = buf as *mut c_char;
                        *mpk_size_out = data.len();
                    }
                    Err(e) => {
                        set_errmsg(errmsg, &e);
                        return 0;
                    }
                }
                // Free SHM
                let _ = crate::voidstar::free_by_schema(abs, &rs);
                let _ = shm::shfree(abs);
            }
            Err(e) => {
                set_errmsg(errmsg, &e);
                return 0;
            }
        }
    } else if source == PACKET_SOURCE_FILE && format == PACKET_FORMAT_MSGPACK {
        // File-based msgpack: read the file
        // Filename lives in the payload, capped at 4096 bytes.
        let filename_bytes = &payload[..payload_len.min(4096)];
        let filename = std::str::from_utf8(filename_bytes).unwrap_or("");
        let filename = filename.trim_end_matches('\0');
        match std::fs::read(filename) {
            Ok(data) => {
                let buf = libc::malloc(data.len()) as *mut u8;
                if buf.is_null() {
                    set_errmsg(errmsg, &MorlocError::Packet("malloc failed".into()));
                    return 0;
                }
                ptr::copy_nonoverlapping(data.as_ptr(), buf, data.len());
                *mpk_out = buf as *mut c_char;
                *mpk_size_out = data.len();
            }
            Err(e) => {
                set_errmsg(errmsg, &MorlocError::Io(e));
                return 0;
            }
        }
    } else if source == PACKET_SOURCE_RPTR && format == PACKET_FORMAT_VOIDSTAR {
        // Voidstar via relptr: convert to msgpack
        let relptr = *(payload.as_ptr() as *const RelPtr);
        match shm::rel2abs(relptr) {
            Ok(abs) => {
                match crate::mpack::pack_with_schema(abs, &rs) {
                    Ok(data) => {
                        let buf = libc::malloc(data.len()) as *mut u8;
                        if buf.is_null() {
                            set_errmsg(errmsg, &MorlocError::Packet("malloc failed".into()));
                            return 0;
                        }
                        ptr::copy_nonoverlapping(data.as_ptr(), buf, data.len());
                        *mpk_out = buf as *mut c_char;
                        *mpk_size_out = data.len();
                    }
                    Err(e) => {
                        set_errmsg(errmsg, &e);
                        return 0;
                    }
                }
            }
            Err(e) => {
                set_errmsg(errmsg, &e);
                return 0;
            }
        }
    } else {
        set_errmsg(errmsg, &MorlocError::Packet(
            format!("Unsupported packet source/format: 0x{:02x}/0x{:02x}", source, format)
        ));
        return 0;
    }
    1 // true
}

// ── Schema from metadata ─────────────────────────────────────────────────────

// Returns a pointer INTO the packet buffer (not owned by the caller), or null
// when no schema metadata entry is present.
#[no_mangle]
pub unsafe extern "C" fn read_schema_from_packet_meta(
    packet: *const u8,
    errmsg: *mut *mut c_char,
) -> *mut c_char {
    clear_errmsg(errmsg);
    let header = read_morloc_packet_header(packet, errmsg);
    if header.is_null() {
        return ptr::null_mut();
    }
    let offset = (*header).offset as usize;
    if offset < 8 { return ptr::null_mut(); } // no room for metadata header
    let meta_start = 32usize;
    let meta_end = meta_start + offset;
    let mut pos = meta_start;
    while pos + 8 <= meta_end {
        if *packet.add(pos) == b'm' && *packet.add(pos + 1) == b'm' && *packet.add(pos + 2) == b'h' {
            let meta_type = *packet.add(pos + 3);
            // NOTE(review): this u32 read assumes `packet` is 4-byte aligned;
            // a bytewise read (read_unaligned) would be safer for C callers.
            let meta_size = *(packet.add(pos + 4) as *const u32) as usize;
            if meta_type == METADATA_TYPE_SCHEMA_STRING {
                // Return pointer into the packet buffer (matches C behavior)
                return packet.add(pos + 8) as *mut c_char;
            }
            pos += 8 + meta_size;
        } else {
            break;
        }
    }
    ptr::null_mut()
}

// ── Fail packet ──────────────────────────────────────────────────────────────

// Build a FAIL-status data packet whose payload is the given message.
#[no_mangle]
pub unsafe extern "C" fn make_fail_packet(
    failure_message: *const c_char,
) -> *mut u8 {
    if failure_message.is_null() {
        return ptr::null_mut();
    }
    let msg = CStr::from_ptr(failure_message).to_bytes();
    make_data_packet_raw(
        msg.as_ptr(), msg.len(),
        ptr::null(), 0,
        PACKET_SOURCE_MESG, PACKET_FORMAT_TEXT,
        PACKET_COMPRESSION_NONE, PACKET_ENCRYPTION_NONE, PACKET_STATUS_FAIL,
    )
}

// ── Error message extraction ─────────────────────────────────────────────────

// Returns a calloc'd, NUL-terminated copy of a fail packet's message (caller
// frees), or null when the packet is not a failure.
#[no_mangle]
pub unsafe extern "C" fn get_morloc_data_packet_error_message(
    data: *const u8,
    errmsg: *mut *mut c_char,
) -> *mut c_char {
    clear_errmsg(errmsg);
    let header = read_morloc_packet_header(data, errmsg);
    if header.is_null() {
        return ptr::null_mut();
    }
    if (*header).is_fail() {
        let payload_start = 32 + (*header).offset as usize;
        let payload_len = (*header).length as usize;
        // +1 so the calloc'd zero byte terminates the string.
        let buf = libc::calloc(payload_len + 1, 1) as *mut c_char;
        if buf.is_null() {
            set_errmsg(errmsg, &MorlocError::Packet("Failed to allocate error message".into()));
            return ptr::null_mut();
        }
        ptr::copy_nonoverlapping(data.add(payload_start), buf as *mut u8, payload_len);
        return buf;
    }
    ptr::null_mut()
}

// ── get_morloc_data_packet_value ─────────────────────────────────────────────

// Resolve a data packet to an absolute SHM pointer for its value, loading
// from inline msgpack/voidstar, a file, or an SHM relptr as appropriate.
#[no_mangle]
pub unsafe extern "C" fn get_morloc_data_packet_value(
    data: *const u8,
    schema: *const CSchema,
    errmsg: *mut *mut c_char,
) -> *mut u8 {
    clear_errmsg(errmsg);
    let header = read_morloc_packet_header(data, errmsg);
    if header.is_null() {
        return ptr::null_mut();
    }
    if (*header).command_type() != PACKET_TYPE_DATA {
        set_errmsg(errmsg, &MorlocError::Packet("Expected a data packet".into()));
        return ptr::null_mut();
    }
    // Check for error
    let packet_error = get_morloc_data_packet_error_message(data, errmsg);
    if !packet_error.is_null() {
        let err_str = CStr::from_ptr(packet_error).to_string_lossy().into_owned();
        libc::free(packet_error as *mut c_void);
        set_errmsg(errmsg, &MorlocError::Packet(format!("\n{}", err_str)));
        return ptr::null_mut();
    }
    // Clear any errmsg from get_morloc_data_packet_error_message
    clear_errmsg(errmsg);
    let rs = CSchema::to_rust(schema);
    let source = (*header).command.data.source;
    let format = (*header).command.data.format;
    let payload_start = 32 + (*header).offset as usize;
    let payload_len = (*header).length as usize;
    match source {
        PACKET_SOURCE_MESG => {
            if format == PACKET_FORMAT_MSGPACK {
                let payload = std::slice::from_raw_parts(data.add(payload_start), payload_len);
                match crate::mpack::unpack_with_schema(payload, &rs) {
                    Ok(abs) => abs,
                    Err(e) => { set_errmsg(errmsg, &e); ptr::null_mut() }
                }
            } else if format == PACKET_FORMAT_VOIDSTAR {
                let payload = std::slice::from_raw_parts(data.add(payload_start), payload_len);
                match crate::voidstar::read_binary(payload, &rs) {
                    Ok(abs) => abs,
                    Err(e) => { set_errmsg(errmsg, &e); ptr::null_mut() }
                }
            } else {
                set_errmsg(errmsg, &MorlocError::Packet(
                    format!("Invalid format from mesg: 0x{:02x}", format)
                ));
                ptr::null_mut()
            }
        }
        PACKET_SOURCE_FILE => {
            if format == PACKET_FORMAT_MSGPACK {
                // Filename payload, capped at 4096 bytes.
                let filename_bytes = std::slice::from_raw_parts(data.add(payload_start), payload_len.min(4096));
                let filename = std::str::from_utf8(filename_bytes).unwrap_or("");
                let filename = filename.trim_end_matches('\0');
                match std::fs::read(filename) {
                    Ok(file_data) => {
                        match crate::mpack::unpack_with_schema(&file_data, &rs) {
                            Ok(abs) => abs,
                            Err(e) => { set_errmsg(errmsg, &e); ptr::null_mut() }
                        }
                    }
                    Err(e) => { set_errmsg(errmsg, &MorlocError::Io(e)); ptr::null_mut() }
                }
            } else {
                set_errmsg(errmsg, &MorlocError::Packet(
                    format!("Invalid format from file: 0x{:02x}", format)
                ));
                ptr::null_mut()
            }
        }
        PACKET_SOURCE_RPTR => {
            if format == PACKET_FORMAT_VOIDSTAR || format == PACKET_FORMAT_ARROW {
                let relptr = *(data.add(payload_start) as *const RelPtr);
                match shm::rel2abs(relptr) {
                    Ok(abs) => abs,
                    Err(e) => { set_errmsg(errmsg, &e); ptr::null_mut() }
                }
            } else {
                set_errmsg(errmsg, &MorlocError::Packet(
                    format!("For RPTR source, expected voidstar or arrow format, found: 0x{:02x}", format)
                ));
                ptr::null_mut()
            }
        }
        _ => {
            set_errmsg(errmsg, &MorlocError::Packet("Invalid source".into()));
            ptr::null_mut()
        }
    }
}

// ── Call packet construction ─────────────────────────────────────────────────

// Build a CALL packet whose payload is the concatenation of the argument
// packets, validated via their headers.
unsafe fn make_call_packet_gen(
    midx: u32,
    entrypoint: u8,
    arg_packets: *const *const u8,
    nargs: usize,
    errmsg: *mut *mut c_char,
) -> *mut u8 {
    clear_errmsg(errmsg);
    // Calculate total data length
    let mut data_length: usize = 0;
    for i in 0..nargs {
        let arg = read_morloc_packet_header(*arg_packets.add(i), errmsg);
        if arg.is_null() {
            return ptr::null_mut();
        }
        data_length += morloc_packet_size_from_header(arg);
    }
    let total = 32 + data_length;
    let packet = libc::calloc(total, 1) as *mut u8;
    if packet.is_null() {
        set_errmsg(errmsg, &MorlocError::Packet("Failed to allocate call packet".into()));
        return ptr::null_mut();
    }
    let cmd = CommandCall {
        cmd_type: PACKET_TYPE_CALL,
        entrypoint,
        padding: [0; 2],
        midx,
    };
    let header = PacketHeader {
        magic: PACKET_MAGIC,
        plain: THIS_PLAIN,
        version: THIS_VERSION,
        flavor: DEFAULT_FLAVOR,
        mode: DEFAULT_MODE,
        command: PacketCommand { call: cmd },
        offset: 0,
        length: data_length as u64,
    };
    let hdr_bytes = header.to_bytes();
    ptr::copy_nonoverlapping(hdr_bytes.as_ptr(), packet, 32);
    // Second pass: copy each argument packet verbatim into the payload.
    let mut pos = 32;
    for i in 0..nargs {
        let arg = read_morloc_packet_header(*arg_packets.add(i), errmsg);
        if arg.is_null() {
            libc::free(packet as *mut c_void);
            return ptr::null_mut();
        }
        let arg_size = morloc_packet_size_from_header(arg);
        ptr::copy_nonoverlapping(*arg_packets.add(i), packet.add(pos), arg_size);
        pos += arg_size;
    }
    packet
}

#[no_mangle]
pub unsafe extern "C" fn make_morloc_local_call_packet(
    midx: u32,
    arg_packets: *const *const u8,
    nargs: usize,
    errmsg: *mut *mut c_char,
) -> *mut u8 {
    make_call_packet_gen(midx, PACKET_ENTRYPOINT_LOCAL, arg_packets, nargs, errmsg)
}

#[no_mangle]
pub unsafe extern "C" fn make_morloc_remote_call_packet(
    midx: u32,
    arg_packets: *const *const u8,
    nargs: usize,
    errmsg: *mut *mut c_char,
) -> *mut u8 {
    make_call_packet_gen(midx, PACKET_ENTRYPOINT_REMOTE_SFS, arg_packets, nargs, errmsg)
}

// ── Call packet reading ──────────────────────────────────────────────────────

// Parse a CALL packet into a MorlocCall whose arg pointers BORROW into the
// original packet buffer (owns_args = 0). Caller frees with free_morloc_call.
#[no_mangle]
pub unsafe extern "C" fn read_morloc_call_packet(
    packet: *const u8,
    errmsg: *mut *mut c_char,
) -> *mut MorlocCall {
    clear_errmsg(errmsg);
    // NOTE(review): the generic argument of size_of below was lost in
    // extraction — presumably size_of::<MorlocCall>(); confirm against the repo.
    let call = libc::calloc(1, std::mem::size_of::()) as *mut MorlocCall;
    if call.is_null() {
        set_errmsg(errmsg, &MorlocError::Packet("calloc failed".into()));
        return ptr::null_mut();
    }
    let header = read_morloc_packet_header(packet, errmsg);
    if header.is_null() {
        libc::free(call as *mut c_void);
        return ptr::null_mut();
    }
    if (*header).command_type() != PACKET_TYPE_CALL {
        set_errmsg(errmsg, &MorlocError::Packet("Expected packet to be a call".into()));
        libc::free(call as *mut c_void);
        return ptr::null_mut();
    }
    (*call).midx = (*header).command.call.midx;
    (*call).nargs = 0;
    (*call).args = ptr::null_mut();
    (*call).owns_args = 0; // borrowing pointers into packet
    let start_pos = 32 + (*header).offset as usize;
    let end_pos = start_pos + (*header).length as usize;
    // First pass: count args
    let mut pos = start_pos;
    while pos < end_pos {
        let arg_size = morloc_packet_size(packet.add(pos), errmsg);
        if arg_size == 0 {
            free_morloc_call(call);
            return ptr::null_mut();
        }
        pos += arg_size;
        (*call).nargs += 1;
    }
    // Allocate args array
    (*call).args = libc::calloc((*call).nargs, std::mem::size_of::<*mut u8>()) as *mut *mut u8;
    if (*call).args.is_null() {
        set_errmsg(errmsg, &MorlocError::Packet("calloc failed for args".into()));
        libc::free(call as *mut c_void);
        return ptr::null_mut();
    }
    // Second pass: fill pointers (borrowing into original packet)
    pos = start_pos;
    for i in 0..(*call).nargs {
        let arg_header = read_morloc_packet_header(packet.add(pos), errmsg);
        if arg_header.is_null() {
            free_morloc_call(call);
            return ptr::null_mut();
        }
        if (*arg_header).command_type() != PACKET_TYPE_DATA {
            set_errmsg(errmsg, &MorlocError::Packet(
                format!("Argument #{} is not a DATA packet (type={})", i, (*arg_header).command_type())
            ));
            free_morloc_call(call);
            return ptr::null_mut();
        }
        *(*call).args.add(i) = packet.add(pos) as *mut u8;
        pos += morloc_packet_size_from_header(arg_header);
    }
    call
}

// Free a MorlocCall; frees the arg packets themselves only when owns_args != 0.
#[no_mangle]
pub unsafe extern "C" fn free_morloc_call(call: *mut MorlocCall) {
    if call.is_null() {
        return;
    }
    let c = &*call;
    if !c.args.is_null() {
        if c.owns_args != 0 {
            for i in 0..c.nargs {
                let arg = *c.args.add(i);
                if !arg.is_null() {
                    libc::free(arg as *mut c_void);
                }
            }
        }
        libc::free(c.args as *mut c_void);
    }
    libc::free(call as *mut c_void);
}

// adjust_voidstar_relptrs: still provided by cli.c (will move to Rust when cli.c is ported)
// read_voidstar_binary: still provided by cli.c (will move to Rust when cli.c is ported)

// ── write_voidstar_binary (for intrinsics.c) ─────────────────────────────────

// Serialize a voidstar value to a file descriptor; returns the byte count
// written (as a RelPtr-typed integer) or -1 on error.
#[no_mangle]
pub unsafe extern "C" fn write_voidstar_binary(
    fd: i32,
    data: *const c_void,
    schema: *const CSchema,
    errmsg: *mut *mut c_char,
) -> RelPtr {
    clear_errmsg(errmsg);
    let rs = CSchema::to_rust(schema);
    match crate::voidstar::write_binary_to_fd(fd, data as AbsPtr, &rs) {
        Ok(n) => n as RelPtr,
        Err(e) => {
            set_errmsg(errmsg, &e);
            -1isize as RelPtr
        }
    }
}

// ── flatten_voidstar_to_buffer ───────────────────────────────────────────────

// Flatten a voidstar value to a malloc'd buffer (caller frees).
// Returns 0 on success, 1 on failure (errmsg set).
#[no_mangle]
pub unsafe extern "C" fn flatten_voidstar_to_buffer(
    data: *const c_void,
    schema: *const CSchema,
    out_buf: *mut *mut u8,
    out_size: *mut usize,
    errmsg: *mut *mut c_char,
) -> i32 {
    clear_errmsg(errmsg);
    *out_buf = ptr::null_mut();
    *out_size = 0;
    let rs = CSchema::to_rust(schema);
    match crate::voidstar::flatten_to_buffer(data as AbsPtr, &rs) {
        Ok(buf) => {
            let len = buf.len();
            let c_buf = libc::malloc(len) as *mut u8;
            if c_buf.is_null() {
                set_errmsg(errmsg, &MorlocError::Packet("malloc failed".into()));
                return 1;
            }
            ptr::copy_nonoverlapping(buf.as_ptr(), c_buf, len);
            *out_buf = c_buf;
            *out_size = len;
            0
        }
        Err(e) => {
            set_errmsg(errmsg, &e);
            1
        }
    }
}

// read_voidstar_binary: still provided by cli.c (will move to Rust when cli.c is ported)

// ── make_data_packet_auto ────────────────────────────────────────────────────

// Choose between an inline (MESG/voidstar) packet for small values and a
// relptr (RPTR) packet for large ones, based on MORLOC_INLINE_THRESHOLD.
#[no_mangle]
pub unsafe extern "C" fn make_data_packet_auto(
    voidstar: *mut c_void,
    relptr: RelPtr,
    schema: *const CSchema,
    errmsg: *mut *mut c_char,
) -> *mut u8 {
    clear_errmsg(errmsg);
    let rs = CSchema::to_rust(schema);
    let flat_size = match crate::ffi::calc_voidstar_size_inner(voidstar as *const u8, &rs) {
        Ok(s) => s,
        Err(e) => {
            set_errmsg(errmsg, &e);
            return ptr::null_mut();
        }
    };
    if flat_size <= MORLOC_INLINE_THRESHOLD {
        match crate::voidstar::flatten_to_buffer(voidstar as AbsPtr, &rs) {
            Ok(blob) => {
                let packet = make_data_packet_with_schema(
                    blob.as_ptr(), blob.len(), schema,
                    PACKET_SOURCE_MESG, PACKET_FORMAT_VOIDSTAR,
                    PACKET_COMPRESSION_NONE, PACKET_ENCRYPTION_NONE, PACKET_STATUS_PASS,
                );
                if packet.is_null() {
                    set_errmsg(errmsg, &MorlocError::Packet("Failed to create inline data packet".into()));
                }
                return packet;
            }
            Err(e) => {
                set_errmsg(errmsg, &e);
                return ptr::null_mut();
            }
        }
    }
    make_standard_data_packet(relptr, schema)
}

// ── print_morloc_data_packet ─────────────────────────────────────────────────

// Write a data packet to stdout; RPTR/voidstar packets are flattened into an
// inline form on the fly. Returns 0 on success, 1 on failure.
#[no_mangle]
pub unsafe extern "C" fn print_morloc_data_packet(
    packet: *const u8,
    schema: *const CSchema,
    errmsg: *mut *mut c_char,
) -> i32 {
    clear_errmsg(errmsg);
    let header = read_morloc_packet_header(packet, errmsg);
    if header.is_null() {
        return 1;
    }
    if (*header).command_type() != PACKET_TYPE_DATA {
        set_errmsg(errmsg, &MorlocError::Packet("Expected a data packet".into()));
        return 1;
    }
    // Check for error
    let packet_error = get_morloc_data_packet_error_message(packet, errmsg);
    if !packet_error.is_null() {
        let err_str = CStr::from_ptr(packet_error).to_string_lossy().into_owned();
        libc::free(packet_error as *mut c_void);
        set_errmsg(errmsg, &MorlocError::Packet(format!("\n{}", err_str)));
        return 1;
    }
    clear_errmsg(errmsg);
    let rs = CSchema::to_rust(schema);
    let source = (*header).command.data.source;
    let format = (*header).command.data.format;
    let packet_size = morloc_packet_size_from_header(header);
    match source {
        PACKET_SOURCE_MESG | PACKET_SOURCE_FILE => {
            // Print the raw packet bytes
            if print_binary(packet, packet_size, errmsg) != 0 {
                return 1;
            }
        }
        PACKET_SOURCE_RPTR => {
            match format {
                PACKET_FORMAT_VOIDSTAR => {
                    let payload_start = 32 + (*header).offset as usize;
                    let relptr = *(packet.add(payload_start) as *const RelPtr);
                    let voidstar_ptr = match shm::rel2abs(relptr) {
                        Ok(p) => p,
                        Err(e) => { set_errmsg(errmsg, &e); return 1; }
                    };
                    // Build modified header with flat size
                    let flat_size = match crate::ffi::calc_voidstar_size_inner(voidstar_ptr, &rs) {
                        Ok(s) => s,
                        Err(e) => { set_errmsg(errmsg, &e); return 1; }
                    };
                    let mut new_header = *header;
                    new_header.command.data.format = PACKET_FORMAT_VOIDSTAR;
                    // Safely set length (packed struct)
                    // NOTE(review): byte offset 24 assumes `length: u64` sits at
                    // bytes 24..32 of the 32-byte packed header — confirm the
                    // PacketHeader field layout before touching this.
                    let new_hdr_ptr = &mut new_header as *mut PacketHeader as *mut u8;
                    *(new_hdr_ptr.add(24) as *mut u64) = flat_size as u64;
                    // Print header
                    if print_binary(&new_header as *const PacketHeader as *const u8, 32, errmsg) != 0 {
                        return 1;
                    }
                    // Print metadata
                    let offset = (*header).offset as usize;
                    if offset > 0 {
                        if print_binary(packet.add(32), offset, errmsg) != 0 {
                            return 1;
                        }
                    }
                    // Write flattened voidstar data to stdout
                    match crate::voidstar::write_binary_to_fd(libc::STDOUT_FILENO, voidstar_ptr, &rs) {
                        Ok(_) => {}
                        Err(e) => { set_errmsg(errmsg, &e); return 1; }
                    }
                }
                _ => {
                    // Other formats: print raw packet
                    if print_binary(packet, packet_size, errmsg) != 0 {
                        return 1;
                    }
                }
            }
        }
        _ => {
            set_errmsg(errmsg, &MorlocError::Packet("Invalid source".into()));
            return 1;
        }
    }
    0 // EXIT_PASS
}

/// Write binary data to stdout.
///
/// # Safety
/// `buf` must point to at least `count` readable bytes.
unsafe fn print_binary(
    buf: *const u8,
    count: usize,
    errmsg: *mut *mut c_char,
) -> i32 {
    // Loop to handle short writes from write(2).
    let mut written: usize = 0;
    while written < count {
        let n = libc::write(
            libc::STDOUT_FILENO,
            buf.add(written) as *const c_void,
            count - written,
        );
        if n < 0 {
            set_errmsg(errmsg, &MorlocError::Io(std::io::Error::last_os_error()));
            return 1;
        }
        written += n as usize;
    }
    0
}


================================================
FILE: data/rust/morloc-runtime/src/pool_ffi.rs
================================================
//! Pool server lifecycle: accept connections, dispatch packets, manage workers.
//! Replaces pool.c. Uses std::thread instead of raw pthreads for thread mode.
//! Pool server lifecycle: accept connections, dispatch packets, manage workers.
//! Replaces pool.c. Uses std::thread instead of raw pthreads for thread mode.

use std::ffi::{c_char, c_void};
use std::ptr;
use std::sync::atomic::{AtomicBool, AtomicI32, Ordering};
use std::sync::{Arc, Mutex, Condvar};

// ── C-compatible types matching pool.h ───────────────────────────────────────

/// Dispatch callback: manifest id, argument packet pointers, argument count,
/// and an opaque language-runtime context. Returns a malloc'd result packet.
pub type PoolDispatchFn = unsafe extern "C" fn(
    mid: u32,
    args: *const *const u8,
    nargs: usize,
    ctx: *mut c_void,
) -> *mut u8;

/// Worker concurrency model selected by the embedding language runtime.
#[repr(C)]
#[derive(Debug, Clone, Copy, PartialEq)]
pub enum PoolConcurrency {
    Threads = 0,
    Fork = 1,
    Single = 2,
}

/// Pool configuration passed across the C ABI.
#[repr(C)]
pub struct PoolConfig {
    pub local_dispatch: PoolDispatchFn,
    pub remote_dispatch: PoolDispatchFn,
    pub dispatch_ctx: *mut c_void,
    pub concurrency: PoolConcurrency,
    pub initial_workers: i32,
    pub dynamic_scaling: bool,
    // NOTE(review): the generic parameter was garbled in extraction; the fork
    // path calls `pfk(config.dispatch_ctx)`, so the signature below is
    // inferred — confirm against pool.h.
    pub post_fork_child: Option<unsafe extern "C" fn(*mut c_void)>,
}

// SAFETY: PoolConfig contains function pointers and a *mut c_void dispatch_ctx.
// The function pointers are set once at startup and never mutated.
// dispatch_ctx points to language-runtime state that is either thread-local
// (fork mode) or protected by the runtime's own synchronization (thread mode).
// The pool architecture guarantees dispatch_ctx is not concurrently mutated.
unsafe impl Send for PoolConfig {}
unsafe impl Sync for PoolConfig {}

// ── Global state ─────────────────────────────────────────────────────────────

/// Set by the SIGTERM handler; polled by the accept and worker loops.
static SHUTTING_DOWN: AtomicBool = AtomicBool::new(false);
/// Number of workers currently processing a request (thread mode).
static BUSY_COUNT: AtomicI32 = AtomicI32::new(0);
/// Total spawned workers (threads or forked children).
static TOTAL_WORKERS: AtomicI32 = AtomicI32::new(0);

// SAFETY: SHARED_BUSY is set once in pool_main_fork (parent process) before
// forking children. After fork, each process accesses the mmap'd AtomicI32
// via atomic operations only. Reset to null during shutdown.
static mut SHARED_BUSY: *mut AtomicI32 = ptr::null_mut();

/// Increment the busy-worker counter (shared mmap'd counter in fork mode,
/// process-local atomic otherwise).
#[no_mangle]
pub extern "C" fn pool_mark_busy() {
    // SAFETY: SHARED_BUSY is either null (thread mode, use local atomic) or a valid
    // mmap'd AtomicI32 pointer set during pool_main_fork initialization.
    unsafe {
        if !SHARED_BUSY.is_null() {
            (*SHARED_BUSY).fetch_add(1, Ordering::Relaxed);
        } else {
            BUSY_COUNT.fetch_add(1, Ordering::Relaxed);
        }
    }
}

/// Decrement the busy-worker counter; mirror of `pool_mark_busy`.
#[no_mangle]
pub extern "C" fn pool_mark_idle() {
    // SAFETY: Same as pool_mark_busy - SHARED_BUSY is null or a valid mmap'd pointer.
    unsafe {
        if !SHARED_BUSY.is_null() {
            (*SHARED_BUSY).fetch_sub(1, Ordering::Relaxed);
        } else {
            BUSY_COUNT.fetch_sub(1, Ordering::Relaxed);
        }
    }
}

/// Async-signal-safe SIGTERM handler: request an orderly shutdown.
extern "C" fn pool_sigterm_handler(_sig: i32) {
    SHUTTING_DOWN.store(true, Ordering::Relaxed);
}
// ── Packet dispatch ──────────────────────────────────────────────────────────

/// Route one incoming packet: answer pings inline, forward local/remote call
/// packets to the matching dispatch callback, and wrap every failure in a
/// fail packet so the client always receives a reply.
///
/// # Safety
/// `packet` must be null or point to a complete morloc packet; the dispatch
/// function pointers must be valid for the duration of the call.
#[no_mangle]
pub unsafe extern "C" fn pool_dispatch_packet(
    packet: *const u8,
    local_dispatch: PoolDispatchFn,
    remote_dispatch: PoolDispatchFn,
    ctx: *mut c_void,
) -> *mut u8 {
    extern "C" {
        fn make_fail_packet(msg: *const c_char) -> *mut u8;
        fn packet_is_ping(packet: *const u8, errmsg: *mut *mut c_char) -> bool;
        fn return_ping(packet: *const u8, errmsg: *mut *mut c_char) -> *mut u8;
        fn packet_is_local_call(packet: *const u8, errmsg: *mut *mut c_char) -> bool;
        fn packet_is_remote_call(packet: *const u8, errmsg: *mut *mut c_char) -> bool;
        fn read_morloc_call_packet(
            packet: *const u8,
            errmsg: *mut *mut c_char,
        ) -> *mut crate::packet_ffi::MorlocCall;
        fn free_morloc_call(call: *mut crate::packet_ffi::MorlocCall);
    }

    if packet.is_null() {
        return make_fail_packet(b"NULL packet in pool dispatch\0".as_ptr() as *const c_char);
    }

    let mut errmsg: *mut c_char = ptr::null_mut();

    // Ping packets are answered without touching the dispatcher.
    if packet_is_ping(packet, &mut errmsg) {
        if !errmsg.is_null() {
            return fail_from_errmsg(errmsg);
        }
        let pong = return_ping(packet, &mut errmsg);
        if !errmsg.is_null() {
            return fail_from_errmsg(errmsg);
        }
        return pong;
    }
    if !errmsg.is_null() {
        return fail_from_errmsg(errmsg);
    }

    let is_local = packet_is_local_call(packet, &mut errmsg);
    if !errmsg.is_null() {
        return fail_from_errmsg(errmsg);
    }
    let is_remote = packet_is_remote_call(packet, &mut errmsg);
    if !errmsg.is_null() {
        return fail_from_errmsg(errmsg);
    }

    if is_local || is_remote {
        let call = read_morloc_call_packet(packet, &mut errmsg);
        if !errmsg.is_null() {
            return fail_from_errmsg(errmsg);
        }
        let mid = (*call).midx;
        let args = (*call).args as *const *const u8;
        let nargs = (*call).nargs;
        let dispatch_fn = if is_local { local_dispatch } else { remote_dispatch };
        let result = dispatch_fn(mid, args, nargs, ctx);
        free_morloc_call(call);
        if result.is_null() {
            return make_fail_packet(
                b"dispatch callback returned NULL\0".as_ptr() as *const c_char,
            );
        }
        return result;
    }

    make_fail_packet(b"Unexpected packet type in pool dispatch\0".as_ptr() as *const c_char)
}

/// Convert a malloc'd error string into a fail packet, freeing the string.
unsafe fn fail_from_errmsg(errmsg: *mut c_char) -> *mut u8 {
    extern "C" {
        fn make_fail_packet(msg: *const c_char) -> *mut u8;
    }
    let pkt = make_fail_packet(errmsg);
    libc::free(errmsg as *mut c_void);
    pkt
}

// ── Helpers ──────────────────────────────────────────────────────────────────

/// Best-effort: send a fail packet to the client. Errors encountered while
/// sending the failure itself are discarded.
unsafe fn try_send_fail(client_fd: i32, msg: *const c_char) {
    extern "C" {
        fn make_fail_packet(msg: *const c_char) -> *mut u8;
        fn send_packet_to_foreign_server(
            fd: i32,
            packet: *mut u8,
            errmsg: *mut *mut c_char,
        ) -> usize;
    }
    let fail = make_fail_packet(if msg.is_null() {
        b"Unknown error\0".as_ptr() as *const c_char
    } else {
        msg
    });
    if !fail.is_null() {
        let mut err: *mut c_char = ptr::null_mut();
        send_packet_to_foreign_server(client_fd, fail, &mut err);
        libc::free(fail as *mut c_void);
        if !err.is_null() {
            libc::free(err as *mut c_void);
        }
    }
}

// ── Thread mode job queue ────────────────────────────────────────────────────

/// LIFO queue of client fds shared between the accept loop and worker
/// threads. `pop` waits with a 100 ms timeout so workers notice shutdown
/// even without a notification.
struct JobQueue {
    // NOTE(review): generic parameters were garbled in extraction; `push`
    // takes an i32 fd and `pop` yields one, so Vec<i32> is inferred.
    jobs: Mutex<Vec<i32>>,
    cond: Condvar,
}

impl JobQueue {
    fn new() -> Self {
        JobQueue { jobs: Mutex::new(Vec::new()), cond: Condvar::new() }
    }

    /// Enqueue a client fd and wake one waiting worker.
    fn push(&self, fd: i32) {
        let mut jobs = self.jobs.lock().unwrap();
        jobs.push(fd);
        self.cond.notify_one();
    }

    /// Dequeue a client fd; returns None once shutdown has been requested.
    fn pop(&self) -> Option<i32> {
        let mut jobs = self.jobs.lock().unwrap();
        loop {
            if SHUTTING_DOWN.load(Ordering::Relaxed) {
                return None;
            }
            if let Some(fd) = jobs.pop() {
                return Some(fd);
            }
            // Timed wait so the shutdown flag is re-checked periodically.
            let result = self
                .cond
                .wait_timeout(jobs, std::time::Duration::from_millis(100))
                .unwrap();
            jobs = result.0;
        }
    }
}

// ── Worker thread ────────────────────────────────────────────────────────────

/// Thread-mode worker: pull a client fd from the queue, read one request,
/// dispatch it, send the reply, close the connection; repeat until shutdown.
unsafe fn worker_loop(queue: &JobQueue, config: &PoolConfig) {
    extern "C" {
        fn stream_from_client(fd: i32, errmsg: *mut *mut c_char) -> *mut u8;
        fn send_packet_to_foreign_server(
            fd: i32,
            packet: *mut u8,
            errmsg: *mut *mut c_char,
        ) -> usize;
        fn close_socket(fd: i32);
    }
    while !SHUTTING_DOWN.load(Ordering::Relaxed) {
        let client_fd = match queue.pop() {
            Some(fd) => fd,
            None => break,
        };
        let mut errmsg: *mut c_char = ptr::null_mut();
        let data = stream_from_client(client_fd, &mut errmsg);
        if data.is_null() || !errmsg.is_null() {
            if !errmsg.is_null() {
                try_send_fail(client_fd, errmsg);
                libc::free(errmsg as *mut c_void);
            }
            libc::free(data as *mut c_void);
            close_socket(client_fd);
            continue;
        }
        // Track busy state so the accept loop can spawn new workers if needed
        pool_mark_busy();
        let result = pool_dispatch_packet(
            data,
            config.local_dispatch,
            config.remote_dispatch,
            config.dispatch_ctx,
        );
        pool_mark_idle();
        libc::free(data as *mut c_void);
        if !result.is_null() {
            send_packet_to_foreign_server(client_fd, result, &mut errmsg);
            libc::free(result as *mut c_void);
            if !errmsg.is_null() {
                libc::free(errmsg as *mut c_void);
            }
        }
        libc::fflush(ptr::null_mut()); // flush stdout
        close_socket(client_fd);
    }
}
// ── Pool main: threads mode ──────────────────────────────────────────────────

/// Run the pool with a fixed (optionally growing) set of worker threads that
/// pull client fds off a shared queue. Returns 0 on clean shutdown, 1 if the
/// daemon could not be started.
unsafe fn pool_main_threads(
    config: &PoolConfig,
    socket_path: *const c_char,
    tmpdir: *const c_char,
    shm_basename: *const c_char,
) -> i32 {
    extern "C" {
        fn start_daemon(
            socket_path: *const c_char,
            tmpdir: *const c_char,
            shm_basename: *const c_char,
            size: usize,
            errmsg: *mut *mut c_char,
        ) -> *mut c_void;
        fn close_daemon(daemon: *mut *mut c_void);
        fn wait_for_client_with_timeout(
            daemon: *mut c_void,
            timeout_us: i32,
            errmsg: *mut *mut c_char,
        ) -> i32;
    }
    let mut errmsg: *mut c_char = ptr::null_mut();
    let mut daemon = start_daemon(socket_path, tmpdir, shm_basename, 0xffff, &mut errmsg);
    if !errmsg.is_null() {
        // NOTE(review): fdopen(2, "w") allocates a FILE* that is never
        // fclose'd; harmless on this exit path but worth confirming.
        libc::fprintf(
            libc::fdopen(2, b"w\0".as_ptr() as *const c_char),
            b"Failed to start language server:\n%s\n\0".as_ptr() as *const c_char,
            errmsg,
        );
        libc::free(errmsg as *mut c_void);
        return 1;
    }

    let queue = Arc::new(JobQueue::new());
    let nthreads = config.initial_workers.max(1) as usize;
    TOTAL_WORKERS.store(nthreads as i32, Ordering::Relaxed);

    let mut handles = Vec::with_capacity(nthreads);
    for _ in 0..nthreads {
        let q = Arc::clone(&queue);
        let cfg = ptr::read(config); // Copy config for thread
        handles.push(std::thread::spawn(move || {
            worker_loop(&q, &cfg);
        }));
    }

    // Accept loop: enqueue incoming fds; optionally grow the worker pool.
    while !SHUTTING_DOWN.load(Ordering::Relaxed) {
        let client_fd = wait_for_client_with_timeout(daemon, 10000, &mut errmsg);
        if !errmsg.is_null() {
            libc::free(errmsg as *mut c_void);
            errmsg = ptr::null_mut();
        }
        if client_fd > 0 {
            queue.push(client_fd);
        }
        // Dynamic scaling: spawn a new worker if all are busy
        if config.dynamic_scaling {
            let busy = BUSY_COUNT.load(Ordering::Relaxed);
            let total = TOTAL_WORKERS.load(Ordering::Relaxed);
            if busy >= total {
                let q = Arc::clone(&queue);
                let cfg = ptr::read(config);
                handles.push(std::thread::spawn(move || {
                    worker_loop(&q, &cfg);
                }));
                TOTAL_WORKERS.fetch_add(1, Ordering::Relaxed);
            }
        }
    }

    // Shutdown: wake every waiting worker and join them all.
    SHUTTING_DOWN.store(true, Ordering::Relaxed);
    queue.cond.notify_all();
    for h in handles {
        let _ = h.join();
    }
    close_daemon(&mut daemon);
    0
}

// ── Pool main: single mode ───────────────────────────────────────────────────

/// Run the pool single-threaded: accept, read, dispatch, reply, close — one
/// client at a time. Returns 0 on clean shutdown, 1 on startup failure.
unsafe fn pool_main_single(
    config: &PoolConfig,
    socket_path: *const c_char,
    tmpdir: *const c_char,
    shm_basename: *const c_char,
) -> i32 {
    extern "C" {
        fn start_daemon(
            socket_path: *const c_char,
            tmpdir: *const c_char,
            shm_basename: *const c_char,
            size: usize,
            errmsg: *mut *mut c_char,
        ) -> *mut c_void;
        fn close_daemon(daemon: *mut *mut c_void);
        fn wait_for_client_with_timeout(
            daemon: *mut c_void,
            timeout_us: i32,
            errmsg: *mut *mut c_char,
        ) -> i32;
        fn stream_from_client(fd: i32, errmsg: *mut *mut c_char) -> *mut u8;
        fn send_packet_to_foreign_server(
            fd: i32,
            packet: *mut u8,
            errmsg: *mut *mut c_char,
        ) -> usize;
        fn close_socket(fd: i32);
    }
    let mut errmsg: *mut c_char = ptr::null_mut();
    let mut daemon = start_daemon(socket_path, tmpdir, shm_basename, 0xffff, &mut errmsg);
    if !errmsg.is_null() {
        libc::fprintf(
            libc::fdopen(2, b"w\0".as_ptr() as *const c_char),
            b"Failed to start language server:\n%s\n\0".as_ptr() as *const c_char,
            errmsg,
        );
        libc::free(errmsg as *mut c_void);
        return 1;
    }
    while !SHUTTING_DOWN.load(Ordering::Relaxed) {
        let client_fd = wait_for_client_with_timeout(daemon, 10000, &mut errmsg);
        if !errmsg.is_null() {
            libc::free(errmsg as *mut c_void);
            errmsg = ptr::null_mut();
        }
        if client_fd <= 0 {
            continue;
        }
        let data = stream_from_client(client_fd, &mut errmsg);
        if data.is_null() || !errmsg.is_null() {
            if !errmsg.is_null() {
                try_send_fail(client_fd, errmsg);
                libc::free(errmsg as *mut c_void);
                errmsg = ptr::null_mut();
            }
            libc::free(data as *mut c_void);
            close_socket(client_fd);
            continue;
        }
        let result = pool_dispatch_packet(
            data,
            config.local_dispatch,
            config.remote_dispatch,
            config.dispatch_ctx,
        );
        libc::free(data as *mut c_void);
        if !result.is_null() {
            send_packet_to_foreign_server(client_fd, result, &mut errmsg);
            libc::free(result as *mut c_void);
            if !errmsg.is_null() {
                libc::free(errmsg as *mut c_void);
                errmsg = ptr::null_mut();
            }
        }
        libc::fflush(ptr::null_mut());
        close_socket(client_fd);
    }
    close_daemon(&mut daemon);
    0
}
// ── Pool main: fork mode ─────────────────────────────────────────────────────

/// Run the pool with forked worker processes. The parent accepts connections
/// and passes client fds to children over a Unix socketpair (SCM_RIGHTS);
/// each child attaches its own shm volume and serves requests until SIGTERM.
/// Busy tracking uses an mmap'd counter shared across processes.
unsafe fn pool_main_fork(
    config: &PoolConfig,
    socket_path: *const c_char,
    tmpdir: *const c_char,
    shm_basename: *const c_char,
) -> i32 {
    extern "C" {
        fn start_daemon(
            socket_path: *const c_char,
            tmpdir: *const c_char,
            shm_basename: *const c_char,
            size: usize,
            errmsg: *mut *mut c_char,
        ) -> *mut c_void;
        fn close_daemon(daemon: *mut *mut c_void);
        fn wait_for_client_with_timeout(
            daemon: *mut c_void,
            timeout_us: i32,
            errmsg: *mut *mut c_char,
        ) -> i32;
        fn stream_from_client(fd: i32, errmsg: *mut *mut c_char) -> *mut u8;
        fn send_packet_to_foreign_server(
            fd: i32,
            packet: *mut u8,
            errmsg: *mut *mut c_char,
        ) -> usize;
        fn close_socket(fd: i32);
        fn shinit(
            basename: *const c_char,
            volume: usize,
            size: usize,
            errmsg: *mut *mut c_char,
        ) -> *mut c_void;
    }
    let mut errmsg: *mut c_char = ptr::null_mut();
    let mut daemon = start_daemon(socket_path, tmpdir, shm_basename, 0xffff, &mut errmsg);
    if !errmsg.is_null() {
        libc::fprintf(
            libc::fdopen(2, b"w\0".as_ptr() as *const c_char),
            b"Failed to start language server:\n%s\n\0".as_ptr() as *const c_char,
            errmsg,
        );
        libc::free(errmsg as *mut c_void);
        return 1;
    }

    // Create socketpair for fd passing
    let mut sv = [0i32; 2];
    if libc::socketpair(libc::AF_UNIX, libc::SOCK_STREAM, 0, sv.as_mut_ptr()) < 0 {
        close_daemon(&mut daemon);
        return 1;
    }

    // Shared busy counter via mmap (anonymous + MAP_SHARED so it is visible
    // to the parent and every forked child).
    let shared_counter = libc::mmap(
        ptr::null_mut(),
        std::mem::size_of::<AtomicI32>(),
        libc::PROT_READ | libc::PROT_WRITE,
        libc::MAP_SHARED | libc::MAP_ANONYMOUS,
        -1,
        0,
    ) as *mut AtomicI32;
    if shared_counter == libc::MAP_FAILED as *mut AtomicI32 {
        libc::close(sv[0]);
        libc::close(sv[1]);
        close_daemon(&mut daemon);
        return 1;
    }
    (*shared_counter).store(0, Ordering::Relaxed);
    SHARED_BUSY = shared_counter;

    let nworkers = config.initial_workers.max(1);
    let mut child_pids: Vec<libc::pid_t> = Vec::new();
    for i in 0..nworkers {
        let pid = libc::fork();
        if pid < 0 {
            break;
        }
        if pid == 0 {
            // Child
            libc::close(sv[1]); // close write end
            // Get daemon server_fd from opaque pointer and close it
            // (we can't access the struct fields directly since daemon is *mut c_void,
            // but the child doesn't need to accept connections)
            if let Some(pfk) = config.post_fork_child {
                pfk(config.dispatch_ctx);
            }
            // Each child attaches its own shm volume (1-based index).
            shinit(shm_basename, (i + 1) as usize, 0xffff, &mut errmsg);
            if !errmsg.is_null() {
                // Print the error to stderr before exiting so the nexus can
                // capture it via the pool's redirected stderr file. Without
                // this, a failed shinit in a forked worker child leaves no
                // diagnostic trace anywhere.
                libc::fprintf(
                    libc::fdopen(2, b"w\0".as_ptr() as *const c_char),
                    b"Worker %d shinit failed: %s\n\0".as_ptr() as *const c_char,
                    i as i32,
                    errmsg,
                );
                libc::free(errmsg as *mut c_void);
                libc::_exit(1);
            }
            // Worker loop: receive fds and process
            loop {
                if SHUTTING_DOWN.load(Ordering::Relaxed) {
                    break;
                }
                // 100 ms poll timeout so the shutdown flag is re-checked.
                let mut pfd = libc::pollfd { fd: sv[0], events: libc::POLLIN, revents: 0 };
                let ready = libc::poll(&mut pfd, 1, 100);
                if ready <= 0 {
                    continue;
                }
                let client_fd = recv_fd(sv[0]);
                if client_fd < 0 {
                    break;
                }
                let data = stream_from_client(client_fd, &mut errmsg);
                if data.is_null() || !errmsg.is_null() {
                    if !errmsg.is_null() {
                        try_send_fail(client_fd, errmsg);
                        libc::free(errmsg as *mut c_void);
                        errmsg = ptr::null_mut();
                    }
                    libc::free(data as *mut c_void);
                    close_socket(client_fd);
                    continue;
                }
                let result = pool_dispatch_packet(
                    data,
                    config.local_dispatch,
                    config.remote_dispatch,
                    config.dispatch_ctx,
                );
                libc::free(data as *mut c_void);
                if !result.is_null() {
                    send_packet_to_foreign_server(client_fd, result, &mut errmsg);
                    libc::free(result as *mut c_void);
                    if !errmsg.is_null() {
                        libc::free(errmsg as *mut c_void);
                        errmsg = ptr::null_mut();
                    }
                }
                libc::fflush(ptr::null_mut());
                close_socket(client_fd);
            }
            libc::close(sv[0]);
            libc::_exit(0);
        }
        child_pids.push(pid);
    }
    TOTAL_WORKERS.store(child_pids.len() as i32, Ordering::Relaxed);

    // Parent: accept loop
    while !SHUTTING_DOWN.load(Ordering::Relaxed) {
        let client_fd = wait_for_client_with_timeout(daemon, 10000, &mut errmsg);
        if !errmsg.is_null() {
            libc::free(errmsg as *mut c_void);
            errmsg = ptr::null_mut();
        }
        if client_fd > 0 {
            // Hand the fd to whichever child reads first, then drop our copy.
            send_fd(sv[1], client_fd);
            close_socket(client_fd);
        }
        // Reap dead children
        for pid in child_pids.iter_mut() {
            if *pid > 0 {
                let mut wstatus: i32 = 0;
                if libc::waitpid(*pid, &mut wstatus, libc::WNOHANG) > 0 {
                    *pid = -1;
                }
            }
        }
    }

    // Shutdown: signal every live child, then wait for each.
    for &pid in &child_pids {
        if pid > 0 {
            libc::kill(pid, libc::SIGTERM);
        }
    }
    for &pid in &child_pids {
        if pid > 0 {
            libc::waitpid(pid, ptr::null_mut(), 0);
        }
    }
    libc::close(sv[0]);
    libc::close(sv[1]);
    libc::munmap(shared_counter as *mut c_void, std::mem::size_of::<AtomicI32>());
    SHARED_BUSY = ptr::null_mut();
    close_daemon(&mut daemon);
    0
}

// fd-passing helpers

/// Send fd `fd` over Unix socket `sock` as an SCM_RIGHTS control message
/// (one dummy payload byte). Returns 0 on success, -1 on sendmsg failure.
// NOTE(review): the CMSG size generics were garbled in extraction; an i32 fd
// is copied, so size_of::<i32>() is inferred — confirm against the original.
unsafe fn send_fd(sock: i32, fd: i32) -> i32 {
    let mut buf = [0u8; 1];
    let mut iov = libc::iovec { iov_base: buf.as_mut_ptr() as *mut c_void, iov_len: 1 };
    let cmsg_space = libc::CMSG_SPACE(std::mem::size_of::<i32>() as u32) as usize;
    let mut cmsg_buf = vec![0u8; cmsg_space];
    let mut msg: libc::msghdr = std::mem::zeroed();
    msg.msg_iov = &mut iov;
    msg.msg_iovlen = 1;
    msg.msg_control = cmsg_buf.as_mut_ptr() as *mut c_void;
    msg.msg_controllen = cmsg_space as _;
    let cmsg = libc::CMSG_FIRSTHDR(&msg);
    (*cmsg).cmsg_level = libc::SOL_SOCKET;
    (*cmsg).cmsg_type = libc::SCM_RIGHTS;
    (*cmsg).cmsg_len = libc::CMSG_LEN(std::mem::size_of::<i32>() as u32) as _;
    ptr::copy_nonoverlapping(
        &fd as *const i32 as *const u8,
        libc::CMSG_DATA(cmsg),
        std::mem::size_of::<i32>(),
    );
    if libc::sendmsg(sock, &msg, 0) >= 0 { 0 } else { -1 }
}

/// Receive an fd passed by `send_fd`; returns -1 on error, EOF, or a
/// malformed control message.
unsafe fn recv_fd(sock: i32) -> i32 {
    let mut buf = [0u8; 1];
    let mut iov = libc::iovec { iov_base: buf.as_mut_ptr() as *mut c_void, iov_len: 1 };
    let cmsg_space = libc::CMSG_SPACE(std::mem::size_of::<i32>() as u32) as usize;
    let mut cmsg_buf = vec![0u8; cmsg_space];
    let mut msg: libc::msghdr = std::mem::zeroed();
    msg.msg_iov = &mut iov;
    msg.msg_iovlen = 1;
    msg.msg_control = cmsg_buf.as_mut_ptr() as *mut c_void;
    msg.msg_controllen = cmsg_space as _;
    let n = libc::recvmsg(sock, &mut msg, 0);
    if n <= 0 {
        return -1;
    }
    let cmsg = libc::CMSG_FIRSTHDR(&msg);
    if cmsg.is_null()
        || (*cmsg).cmsg_level != libc::SOL_SOCKET
        || (*cmsg).cmsg_type != libc::SCM_RIGHTS
    {
        return -1;
    }
    let mut fd: i32 = 0;
    ptr::copy_nonoverlapping(
        libc::CMSG_DATA(cmsg),
        &mut fd as *mut i32 as *mut u8,
        std::mem::size_of::<i32>(),
    );
    fd
}
libc::fprintf(libc::fdopen(2, b"w\0".as_ptr() as *const c_char), b"Usage: %s \n\0".as_ptr() as *const c_char, if argc > 0 { *argv } else { b"pool\0".as_ptr() as *const c_char }); return 1; } let cfg = &mut *config; if cfg.initial_workers <= 0 { cfg.initial_workers = 1; } SHUTTING_DOWN.store(false, Ordering::Relaxed); BUSY_COUNT.store(0, Ordering::Relaxed); // SIGTERM handler let mut sa: libc::sigaction = std::mem::zeroed(); sa.sa_sigaction = pool_sigterm_handler as *const () as usize; libc::sigemptyset(&mut sa.sa_mask); libc::sigaction(libc::SIGTERM, &sa, ptr::null_mut()); let socket_path = *argv.add(1); let tmpdir = *argv.add(2); let shm_basename = *argv.add(3); match cfg.concurrency { PoolConcurrency::Threads => pool_main_threads(cfg, socket_path, tmpdir, shm_basename), PoolConcurrency::Fork => pool_main_fork(cfg, socket_path, tmpdir, shm_basename), PoolConcurrency::Single => pool_main_single(cfg, socket_path, tmpdir, shm_basename), } } ================================================ FILE: data/rust/morloc-runtime/src/router_ffi.rs ================================================ //! C ABI wrappers for router subsystems. //! Replaces router.c. Routes requests to per-program daemons. use std::ffi::{c_char, c_void, CStr, CString}; use std::ptr; use std::sync::atomic::{AtomicBool, Ordering}; use std::time::Instant; use crate::daemon_ffi::{ DaemonConfig, DaemonResponse, MorlocSocket, }; use crate::error::{clear_errmsg, set_errmsg, MorlocError}; use crate::http_ffi::{DaemonMethod, DaemonRequest, HttpMethod, HttpRequest}; // -- Constants ---------------------------------------------------------------- /// Max size of sun_path in sockaddr_un (108 on Linux) const SUN_PATH_LEN: usize = 108; // Daemon startup polling (exponential backoff, ~5s total). // Sum of 100 * 1.25^i for i in 0..16 is ~4650ms. 
// Daemon startup polling (exponential backoff, ~5s total).
// Sum of 100 * 1.25^i for i in 0..16 is ~4650ms.
const DAEMON_POLL_INITIAL_MS: f64 = 100.0;
const DAEMON_POLL_MULTIPLIER: f64 = 1.25;
const DAEMON_POLL_MAX_RETRIES: usize = 16;

// -- Global state -------------------------------------------------------------

/// Set by the signal handler to request a clean router shutdown.
static ROUTER_SHUTDOWN_REQUESTED: AtomicBool = AtomicBool::new(false);

extern "C" fn router_signal_handler_fn(_sig: i32) {
    ROUTER_SHUTDOWN_REQUESTED.store(true, Ordering::Relaxed);
}

// -- C-compatible types -------------------------------------------------------

/// One routable program: identity, parsed manifest, and (if started) the
/// daemon child pid plus the unix socket path used to reach it.
#[repr(C)]
pub struct RouterProgram {
    pub name: *mut c_char,
    pub manifest_path: *mut c_char,
    pub manifest: *mut c_void, // manifest_t*
    pub daemon_pid: libc::pid_t,
    pub daemon_socket: [c_char; SUN_PATH_LEN],
}

/// Router state: a growable array of programs discovered under `fdb_path`.
#[repr(C)]
pub struct Router {
    pub programs: *mut RouterProgram,
    pub n_programs: usize,
    pub fdb_path: *mut c_char,
}

// -- router_init --------------------------------------------------------------

/// Scan `fdb_path` for `*.manifest` files and build a Router whose programs
/// each carry a parsed manifest and a `/tmp/morloc-router-<name>.sock`
/// daemon socket path. Unparseable manifests are skipped with a warning.
/// Returns null (with `errmsg` set) only if the directory cannot be opened.
///
/// # Safety
/// `fdb_path` must be a valid C string; the result must be released with
/// `router_free`.
#[no_mangle]
pub unsafe extern "C" fn router_init(
    fdb_path: *const c_char,
    errmsg: *mut *mut c_char,
) -> *mut Router {
    clear_errmsg(errmsg);
    extern "C" {
        fn read_manifest(path: *const c_char, errmsg: *mut *mut c_char) -> *mut c_void;
    }
    let dir = libc::opendir(fdb_path);
    if dir.is_null() {
        let errno_msg = CStr::from_ptr(libc::strerror(crate::utility::errno_val()))
            .to_string_lossy();
        let path_str = CStr::from_ptr(fdb_path).to_string_lossy();
        set_errmsg(
            errmsg,
            &MorlocError::Other(format!(
                "Cannot open fdb directory '{}': {}",
                path_str, errno_msg
            )),
        );
        return ptr::null_mut();
    }

    let router = libc::calloc(1, std::mem::size_of::<Router>()) as *mut Router;
    (*router).fdb_path = libc::strdup(fdb_path);
    let mut cap: usize = 8;
    (*router).programs =
        libc::calloc(cap, std::mem::size_of::<RouterProgram>()) as *mut RouterProgram;
    (*router).n_programs = 0;

    loop {
        let entry = libc::readdir(dir);
        if entry.is_null() {
            break;
        }
        let name = CStr::from_ptr((*entry).d_name.as_ptr());
        let name_str = name.to_string_lossy();
        // ".manifest" is 9 chars; len >= 10 guarantees a non-empty stem.
        if name_str.len() < 10 || !name_str.ends_with(".manifest") {
            continue;
        }

        // Grow array if needed
        // NOTE(review): realloc return is not checked for null — on OOM the
        // old array would leak and the write below would fault.
        if (*router).n_programs >= cap {
            cap *= 2;
            (*router).programs = libc::realloc(
                (*router).programs as *mut c_void,
                cap * std::mem::size_of::<RouterProgram>(),
            ) as *mut RouterProgram;
        }
        let prog = &mut *(*router).programs.add((*router).n_programs);
        ptr::write_bytes(prog as *mut RouterProgram, 0, 1);

        // Extract program name (filename without .manifest)
        let prog_name_len = name_str.len() - 9;
        let prog_name = &name_str[..prog_name_len];
        let c_prog_name = CString::new(prog_name).unwrap_or_default();
        prog.name = libc::strdup(c_prog_name.as_ptr());

        // Build full path
        let fdb_str = CStr::from_ptr(fdb_path).to_string_lossy();
        let full_path = format!("{}/{}", fdb_str, name_str);
        let c_path = CString::new(full_path).unwrap_or_default();
        prog.manifest_path = libc::strdup(c_path.as_ptr());

        // Read and parse manifest; on failure warn, release the strings,
        // and leave the slot for the next candidate.
        let mut child_err: *mut c_char = ptr::null_mut();
        prog.manifest = read_manifest(prog.manifest_path, &mut child_err);
        if !child_err.is_null() {
            let err_str = CStr::from_ptr(child_err).to_string_lossy();
            let path_str = CStr::from_ptr(prog.manifest_path).to_string_lossy();
            eprintln!("router: warning: failed to parse {}: {}", path_str, err_str);
            libc::free(child_err as *mut c_void);
            libc::free(prog.name as *mut c_void);
            libc::free(prog.manifest_path as *mut c_void);
            continue;
        }
        prog.daemon_pid = 0;

        // Set socket path (truncated to SUN_PATH_LEN if necessary)
        let socket_path = format!("/tmp/morloc-router-{}.sock", prog_name);
        let c_socket = CString::new(socket_path).unwrap_or_default();
        let socket_bytes = c_socket.as_bytes_with_nul();
        let copy_len = socket_bytes.len().min(SUN_PATH_LEN);
        ptr::copy_nonoverlapping(
            socket_bytes.as_ptr() as *const c_char,
            prog.daemon_socket.as_mut_ptr(),
            copy_len,
        );
        (*router).n_programs += 1;
    }
    libc::closedir(dir);
    // Empty fdb is fine -- programs can be added while the router is running
    router
}
c_void); } for i in 0..(*router).n_programs { let prog = &mut *(*router).programs.add(i); libc::free(prog.name as *mut c_void); libc::free(prog.manifest_path as *mut c_void); if !prog.manifest.is_null() { free_manifest(prog.manifest); } if prog.daemon_pid > 0 { libc::kill(prog.daemon_pid, libc::SIGTERM); } } libc::free((*router).programs as *mut c_void); libc::free((*router).fdb_path as *mut c_void); libc::free(router as *mut c_void); } // -- morloc-nexus path resolution --------------------------------------------- /// Locate the morloc-nexus executable. /// /// Tries, in order: /// 1. `$MORLOC_NEXUS` (explicit override) /// 2. `$MORLOC_HOME/bin/morloc-nexus` (deploy convention) /// 3. `morloc-nexus` on `$PATH` /// 4. `$HOME/.local/bin/morloc-nexus` (bare-metal developer install) /// /// Returns the path on the first candidate whose `access(_, X_OK)` succeeds, /// or the list of attempted paths on failure. unsafe fn find_morloc_nexus() -> Result> { fn is_executable(path: &str) -> bool { if let Ok(c) = CString::new(path) { unsafe { libc::access(c.as_ptr(), libc::X_OK) == 0 } } else { false } } fn getenv_str(name: &str) -> Option { let c_name = CString::new(name).ok()?; let p = unsafe { libc::getenv(c_name.as_ptr()) }; if p.is_null() { None } else { Some(unsafe { CStr::from_ptr(p) }.to_string_lossy().into_owned()) } } let mut tried: Vec = Vec::new(); // 1. $MORLOC_NEXUS if let Some(p) = getenv_str("MORLOC_NEXUS") { if is_executable(&p) { return Ok(p); } tried.push(format!("$MORLOC_NEXUS={}", p)); } // 2. $MORLOC_HOME/bin/morloc-nexus if let Some(h) = getenv_str("MORLOC_HOME") { let p = format!("{}/bin/morloc-nexus", h); if is_executable(&p) { return Ok(p); } tried.push(p); } // 3. Search $PATH if let Some(path) = getenv_str("PATH") { for dir in path.split(':') { if dir.is_empty() { continue; } let p = format!("{}/morloc-nexus", dir); if is_executable(&p) { return Ok(p); } } tried.push(format!("$PATH ({})", path)); } // 4. 
$HOME/.local/bin/morloc-nexus if let Some(h) = getenv_str("HOME") { let p = format!("{}/.local/bin/morloc-nexus", h); if is_executable(&p) { return Ok(p); } tried.push(p); } Err(tried) } // -- router_start_program ----------------------------------------------------- #[no_mangle] pub unsafe extern "C" fn router_start_program( prog: *mut RouterProgram, errmsg: *mut *mut c_char, ) -> bool { clear_errmsg(errmsg); let nexus_path = match find_morloc_nexus() { Ok(p) => p, Err(tried) => { set_errmsg( errmsg, &MorlocError::Other(format!( "morloc-nexus binary not found; tried: {}", tried.join(", ") )), ); return false; } }; let c_nexus = CString::new(nexus_path.as_str()).unwrap_or_default(); let pid = libc::fork(); if pid == 0 { // Child: exec morloc-nexus with --daemon libc::setpgid(0, 0); let arg_nexus = CString::new("morloc-nexus").unwrap(); let arg_daemon = CString::new("--daemon").unwrap(); let arg_socket = CString::new("--socket").unwrap(); let socket_path = CStr::from_ptr((*prog).daemon_socket.as_ptr()); libc::execl( c_nexus.as_ptr(), arg_nexus.as_ptr(), (*prog).manifest_path, arg_daemon.as_ptr(), arg_socket.as_ptr(), socket_path.as_ptr(), ptr::null::(), ); // If exec fails let prog_name = CStr::from_ptr((*prog).name).to_string_lossy(); let errno_msg = CStr::from_ptr(libc::strerror(crate::utility::errno_val())) .to_string_lossy(); eprintln!( "router: failed to exec morloc-nexus for {}: {}", prog_name, errno_msg ); libc::_exit(1); } else if pid > 0 { (*prog).daemon_pid = pid; // Poll until the daemon socket is connectable (exponential backoff) let mut delay_ms = DAEMON_POLL_INITIAL_MS; let mut connected = false; for _attempt in 0..DAEMON_POLL_MAX_RETRIES { let ts = libc::timespec { tv_sec: 0, tv_nsec: (delay_ms * 1_000_000.0) as i64, }; libc::nanosleep(&ts, ptr::null_mut()); // Check if child died during startup let mut status: i32 = 0; let result = libc::waitpid(pid, &mut status, libc::WNOHANG); if result == pid { (*prog).daemon_pid = 0; let prog_name = 
// -- router_start_program -----------------------------------------------------

/// Fork and exec `morloc-nexus --daemon` for one program, then poll its unix
/// socket with exponential backoff (~5 s total) until it is connectable.
/// Returns true once started (even if the socket is not yet connectable —
/// the caller retries on connect failure), false with `errmsg` set when the
/// binary is missing, fork fails, or the child exits during startup.
///
/// # Safety
/// `prog` must point to a valid RouterProgram with initialized name,
/// manifest_path, and daemon_socket fields.
#[no_mangle]
pub unsafe extern "C" fn router_start_program(
    prog: *mut RouterProgram,
    errmsg: *mut *mut c_char,
) -> bool {
    clear_errmsg(errmsg);
    let nexus_path = match find_morloc_nexus() {
        Ok(p) => p,
        Err(tried) => {
            set_errmsg(
                errmsg,
                &MorlocError::Other(format!(
                    "morloc-nexus binary not found; tried: {}",
                    tried.join(", ")
                )),
            );
            return false;
        }
    };
    let c_nexus = CString::new(nexus_path.as_str()).unwrap_or_default();

    let pid = libc::fork();
    if pid == 0 {
        // Child: exec morloc-nexus with --daemon
        // New process group so the daemon is signalled independently.
        libc::setpgid(0, 0);
        let arg_nexus = CString::new("morloc-nexus").unwrap();
        let arg_daemon = CString::new("--daemon").unwrap();
        let arg_socket = CString::new("--socket").unwrap();
        let socket_path = CStr::from_ptr((*prog).daemon_socket.as_ptr());
        // execl's variadic argument list must end with a null char pointer.
        // NOTE(review): the turbofish was garbled in extraction;
        // ptr::null::<c_char>() restored.
        libc::execl(
            c_nexus.as_ptr(),
            arg_nexus.as_ptr(),
            (*prog).manifest_path,
            arg_daemon.as_ptr(),
            arg_socket.as_ptr(),
            socket_path.as_ptr(),
            ptr::null::<c_char>(),
        );
        // If exec fails
        let prog_name = CStr::from_ptr((*prog).name).to_string_lossy();
        let errno_msg = CStr::from_ptr(libc::strerror(crate::utility::errno_val()))
            .to_string_lossy();
        eprintln!(
            "router: failed to exec morloc-nexus for {}: {}",
            prog_name, errno_msg
        );
        libc::_exit(1);
    } else if pid > 0 {
        (*prog).daemon_pid = pid;
        // Poll until the daemon socket is connectable (exponential backoff)
        let mut delay_ms = DAEMON_POLL_INITIAL_MS;
        let mut connected = false;
        for _attempt in 0..DAEMON_POLL_MAX_RETRIES {
            let ts = libc::timespec {
                tv_sec: 0,
                tv_nsec: (delay_ms * 1_000_000.0) as i64,
            };
            libc::nanosleep(&ts, ptr::null_mut());

            // Check if child died during startup
            let mut status: i32 = 0;
            let result = libc::waitpid(pid, &mut status, libc::WNOHANG);
            if result == pid {
                (*prog).daemon_pid = 0;
                let prog_name = CStr::from_ptr((*prog).name).to_string_lossy();
                set_errmsg(
                    errmsg,
                    &MorlocError::Other(format!(
                        "Daemon for '{}' exited during startup (status {})",
                        prog_name, status
                    )),
                );
                return false;
            }

            // Try connecting to the daemon socket
            let test_sock = libc::socket(libc::AF_UNIX, libc::SOCK_STREAM, 0);
            if test_sock >= 0 {
                let mut addr: libc::sockaddr_un = std::mem::zeroed();
                addr.sun_family = libc::AF_UNIX as libc::sa_family_t;
                let socket_path = (*prog).daemon_socket.as_ptr();
                let path_bytes = CStr::from_ptr(socket_path).to_bytes();
                let copy_len = path_bytes.len().min(addr.sun_path.len() - 1);
                ptr::copy_nonoverlapping(
                    path_bytes.as_ptr() as *const c_char,
                    addr.sun_path.as_mut_ptr(),
                    copy_len,
                );
                let rc = libc::connect(
                    test_sock,
                    &addr as *const libc::sockaddr_un as *const libc::sockaddr,
                    std::mem::size_of::<libc::sockaddr_un>() as libc::socklen_t,
                );
                libc::close(test_sock);
                if rc == 0 {
                    connected = true;
                    break;
                }
            }
            delay_ms *= DAEMON_POLL_MULTIPLIER;
        }
        if !connected {
            // Final check: did the daemon die?
            let mut status: i32 = 0;
            let result = libc::waitpid(pid, &mut status, libc::WNOHANG);
            if result == pid {
                (*prog).daemon_pid = 0;
                let prog_name = CStr::from_ptr((*prog).name).to_string_lossy();
                set_errmsg(
                    errmsg,
                    &MorlocError::Other(format!(
                        "Daemon for '{}' exited during startup (status {})",
                        prog_name, status
                    )),
                );
                return false;
            }
            // Daemon alive but socket not yet connectable -- proceed anyway,
            // router_forward() will retry on connect failure.
        }
        true
    } else {
        let errno_msg = CStr::from_ptr(libc::strerror(crate::utility::errno_val()))
            .to_string_lossy();
        set_errmsg(
            errmsg,
            &MorlocError::Other(format!("fork failed: {}", errno_msg)),
        );
        false
    }
}
sock = connect_to_daemon(prog, errmsg); let sock = if sock < 0 { // Try restarting daemon (*prog).daemon_pid = 0; // Clear previous error if !(*errmsg).is_null() { libc::free(*errmsg as *mut c_void); *errmsg = ptr::null_mut(); } let mut child_err: *mut c_char = ptr::null_mut(); if !router_start_program(prog, &mut child_err) { if !child_err.is_null() { *errmsg = child_err; } return ptr::null_mut(); } let sock2 = connect_to_daemon(prog, errmsg); if sock2 < 0 { return ptr::null_mut(); } sock2 } else { sock }; // Send length-prefixed message let len_buf: [u8; 4] = [ ((req_len >> 24) & 0xFF) as u8, ((req_len >> 16) & 0xFF) as u8, ((req_len >> 8) & 0xFF) as u8, (req_len & 0xFF) as u8, ]; let n = libc::send( sock, len_buf.as_ptr() as *const c_void, 4, crate::utility::SEND_NOSIGNAL, ); if n != 4 { libc::close(sock); set_errmsg( errmsg, &MorlocError::Other("Failed to send request length to daemon".into()), ); return ptr::null_mut(); } let mut total_sent: usize = 0; while total_sent < req_len { let n = libc::send( sock, c_req.as_ptr().add(total_sent) as *const c_void, req_len - total_sent, crate::utility::SEND_NOSIGNAL, ); if n <= 0 { libc::close(sock); set_errmsg( errmsg, &MorlocError::Other("Failed to send request body to daemon".into()), ); return ptr::null_mut(); } total_sent += n as usize; } // Read response length let mut resp_len_buf = [0u8; 4]; let n = libc::recv( sock, resp_len_buf.as_mut_ptr() as *mut c_void, 4, libc::MSG_WAITALL, ); if n != 4 { libc::close(sock); set_errmsg( errmsg, &MorlocError::Other("Failed to read response length from daemon".into()), ); return ptr::null_mut(); } let resp_len = ((resp_len_buf[0] as u32) << 24) | ((resp_len_buf[1] as u32) << 16) | ((resp_len_buf[2] as u32) << 8) | (resp_len_buf[3] as u32); let resp_json = libc::malloc(resp_len as usize + 1) as *mut c_char; if resp_json.is_null() { libc::close(sock); set_errmsg( errmsg, &MorlocError::Other("Failed to allocate response buffer".into()), ); return ptr::null_mut(); } let mut 
total_recv: usize = 0; while total_recv < resp_len as usize { let n = libc::recv( sock, resp_json.add(total_recv) as *mut c_void, resp_len as usize - total_recv, 0, ); if n <= 0 { libc::free(resp_json as *mut c_void); libc::close(sock); set_errmsg( errmsg, &MorlocError::Other("Failed to read response body from daemon".into()), ); return ptr::null_mut(); } total_recv += n as usize; } *resp_json.add(resp_len as usize) = 0; libc::close(sock); let resp = daemon_parse_response(resp_json, resp_len as usize, errmsg); libc::free(resp_json as *mut c_void); resp } /// Helper: connect to a program daemon's unix socket with 60s timeouts. unsafe fn connect_to_daemon( prog: *mut RouterProgram, errmsg: *mut *mut c_char, ) -> i32 { let sock = libc::socket(libc::AF_UNIX, libc::SOCK_STREAM, 0); if sock < 0 { set_errmsg( errmsg, &MorlocError::Other("Failed to create socket".into()), ); return -1; } crate::utility::set_nosigpipe(sock); let tv = libc::timeval { tv_sec: 60, tv_usec: 0, }; libc::setsockopt( sock, libc::SOL_SOCKET, libc::SO_RCVTIMEO, &tv as *const libc::timeval as *const c_void, std::mem::size_of::() as libc::socklen_t, ); libc::setsockopt( sock, libc::SOL_SOCKET, libc::SO_SNDTIMEO, &tv as *const libc::timeval as *const c_void, std::mem::size_of::() as libc::socklen_t, ); let mut addr: libc::sockaddr_un = std::mem::zeroed(); addr.sun_family = libc::AF_UNIX as libc::sa_family_t; let socket_path = (*prog).daemon_socket.as_ptr(); let path_bytes = CStr::from_ptr(socket_path).to_bytes(); let copy_len = path_bytes.len().min(addr.sun_path.len() - 1); ptr::copy_nonoverlapping( path_bytes.as_ptr() as *const c_char, addr.sun_path.as_mut_ptr(), copy_len, ); if libc::connect( sock, &addr as *const libc::sockaddr_un as *const libc::sockaddr, std::mem::size_of::() as libc::socklen_t, ) < 0 { libc::close(sock); let prog_name = CStr::from_ptr((*prog).name).to_string_lossy(); set_errmsg( errmsg, &MorlocError::Other(format!( "Failed to connect to daemon for '{}'", prog_name )), ); return 
-1;
    }
    sock
}

/// Serialize a DaemonRequest to JSON using serde_json.
///
/// Only non-NULL fields are emitted; `args_json` is embedded as a parsed
/// JSON value (and silently dropped if it fails to parse).
unsafe fn serialize_request_to_json(request: *mut DaemonRequest) -> String {
    let mut map = serde_json::Map::new();
    if !(*request).id.is_null() {
        let id = CStr::from_ptr((*request).id).to_string_lossy();
        map.insert("id".into(), serde_json::Value::String(id.into_owned()));
    }
    let method_str = match (*request).method {
        DaemonMethod::Call => "call",
        DaemonMethod::Discover => "discover",
        DaemonMethod::Health => "health",
        DaemonMethod::Eval => "eval",
        DaemonMethod::Typecheck => "typecheck",
        DaemonMethod::Bind => "bind",
        DaemonMethod::Bindings => "bindings",
        DaemonMethod::Unbind => "unbind",
    };
    map.insert(
        "method".into(),
        serde_json::Value::String(method_str.into()),
    );
    if !(*request).command.is_null() {
        let cmd = CStr::from_ptr((*request).command).to_string_lossy();
        map.insert(
            "command".into(),
            serde_json::Value::String(cmd.into_owned()),
        );
    }
    if !(*request).args_json.is_null() {
        let args_str = CStr::from_ptr((*request).args_json).to_string_lossy();
        // Try to parse as JSON value to embed directly
        if let Ok(v) = serde_json::from_str::<serde_json::Value>(&args_str) {
            map.insert("args".into(), v);
        }
    }
    if !(*request).expr.is_null() {
        let expr = CStr::from_ptr((*request).expr).to_string_lossy();
        map.insert("expr".into(), serde_json::Value::String(expr.into_owned()));
    }
    if !(*request).name.is_null() {
        let name = CStr::from_ptr((*request).name).to_string_lossy();
        map.insert("name".into(), serde_json::Value::String(name.into_owned()));
    }
    serde_json::to_string(&map).unwrap_or_else(|_| "{}".into())
}

// -- router_build_discovery ---------------------------------------------------

/// Build the router-level discovery JSON: one entry per program with its
/// running state and, when a manifest is loaded, its command list.
/// Returns a strdup'd C string owned by the caller.
#[no_mangle]
pub unsafe extern "C" fn router_build_discovery(router: *mut Router) -> *mut c_char {
    // Walk the canonical Manifest C struct from manifest_ffi.rs. No
    // local mirror -- the in-memory layout is shared.
    use crate::manifest_ffi::Manifest as ManifestC;
    #[derive(serde::Serialize)]
    struct CommandInfo {
        name: String,
        r#type: String,
        return_type: String,
    }
    #[derive(serde::Serialize)]
    struct ProgramInfo {
        name: String,
        running: bool,
        #[serde(skip_serializing_if = "Option::is_none")]
        commands: Option<Vec<CommandInfo>>,
    }
    #[derive(serde::Serialize)]
    struct Discovery {
        programs: Vec<ProgramInfo>,
    }
    let mut programs = Vec::with_capacity((*router).n_programs);
    for i in 0..(*router).n_programs {
        let prog = &*(*router).programs.add(i);
        let name = CStr::from_ptr(prog.name).to_string_lossy().into_owned();
        // kill(pid, 0) probes process liveness without delivering a signal.
        let running = prog.daemon_pid > 0 && libc::kill(prog.daemon_pid, 0) == 0;
        let commands = if !prog.manifest.is_null() {
            let mv = prog.manifest as *const ManifestC;
            let mut cmds = Vec::with_capacity((*mv).n_commands);
            for c in 0..(*mv).n_commands {
                let cmd = &*(*mv).commands.add(c);
                let cmd_name = CStr::from_ptr(cmd.name).to_string_lossy().into_owned();
                let cmd_type = if cmd.is_pure { "pure" } else { "remote" };
                let ret_type = if !cmd.ret.type_desc.is_null() {
                    CStr::from_ptr(cmd.ret.type_desc)
                        .to_string_lossy()
                        .into_owned()
                } else {
                    String::new()
                };
                cmds.push(CommandInfo {
                    name: cmd_name,
                    r#type: cmd_type.into(),
                    return_type: ret_type,
                });
            }
            Some(cmds)
        } else {
            None
        };
        programs.push(ProgramInfo {
            name,
            running,
            commands,
        });
    }
    let disco = Discovery { programs };
    let json = serde_json::to_string(&disco).unwrap_or_else(|_| "{}".into());
    let c = CString::new(json).unwrap_or_default();
    libc::strdup(c.as_ptr())
}

// -- Router HTTP request routing ----------------------------------------------

/// Route HTTP requests for the router. Sets *out_program to the target program
/// name (caller-owned) for per-program requests, or NULL for router-level requests.
unsafe fn router_http_to_request( req: *mut HttpRequest, out_program: *mut *mut c_char, errmsg: *mut *mut c_char, ) -> *mut DaemonRequest { clear_errmsg(errmsg); let dreq = libc::calloc(1, std::mem::size_of::()) as *mut DaemonRequest; if dreq.is_null() { set_errmsg( errmsg, &MorlocError::Other("Failed to allocate daemon_request_t".into()), ); return ptr::null_mut(); } *out_program = ptr::null_mut(); let path = CStr::from_ptr((*req).path.as_ptr()) .to_str() .unwrap_or(""); let method = (*req).method; let body_str = if !(*req).body.is_null() && (*req).body_len > 0 { std::str::from_utf8(std::slice::from_raw_parts( (*req).body as *const u8, (*req).body_len, )) .unwrap_or("") } else { "" }; // GET /health or GET /health/ if method == HttpMethod::Get && (path == "/health" || path.starts_with("/health/")) { (*dreq).method = DaemonMethod::Health; if path.starts_with("/health/") { let prog_name = &path[8..]; if !prog_name.is_empty() { let c = CString::new(prog_name).unwrap_or_default(); *out_program = libc::strdup(c.as_ptr()); } } return dreq; } // GET /programs or GET /discover if method == HttpMethod::Get && (path == "/programs" || path == "/discover") { (*dreq).method = DaemonMethod::Discover; return dreq; } // GET /discover/ if method == HttpMethod::Get && path.starts_with("/discover/") { let prog_name = &path[10..]; if !prog_name.is_empty() { let c = CString::new(prog_name).unwrap_or_default(); *out_program = libc::strdup(c.as_ptr()); (*dreq).method = DaemonMethod::Discover; return dreq; } } // POST /eval if method == HttpMethod::Post && path == "/eval" { (*dreq).method = DaemonMethod::Eval; if !body_str.is_empty() { if let Ok(v) = serde_json::from_str::(body_str) { if let Some(expr) = v.get("expr").and_then(|e| e.as_str()) { let c = CString::new(expr).unwrap_or_default(); (*dreq).expr = libc::strdup(c.as_ptr()); } } } if (*dreq).expr.is_null() { libc::free(dreq as *mut c_void); set_errmsg( errmsg, &MorlocError::Other("Missing 'expr' field in /eval request 
body".into()), ); return ptr::null_mut(); } return dreq; } // POST /call// if method == HttpMethod::Post && path.starts_with("/call/") { let rest = &path[6..]; let slash = rest.find('/'); match slash { Some(pos) if pos + 1 < rest.len() => { let prog_name = &rest[..pos]; let cmd_name = &rest[pos + 1..]; let c_prog = CString::new(prog_name).unwrap_or_default(); *out_program = libc::strdup(c_prog.as_ptr()); (*dreq).method = DaemonMethod::Call; let c_cmd = CString::new(cmd_name).unwrap_or_default(); (*dreq).command = libc::strdup(c_cmd.as_ptr()); // Parse body for args let trimmed = body_str.trim(); if trimmed.starts_with('[') { let c = CString::new(trimmed).unwrap_or_default(); (*dreq).args_json = libc::strdup(c.as_ptr()); } else if trimmed.starts_with('{') { if let Ok(v) = serde_json::from_str::(trimmed) { if let Some(args) = v.get("args") { let args_str = serde_json::to_string(args).unwrap_or_default(); let c = CString::new(args_str).unwrap_or_default(); (*dreq).args_json = libc::strdup(c.as_ptr()); } } } return dreq; } _ => { libc::free(dreq as *mut c_void); set_errmsg( errmsg, &MorlocError::Other("Expected /call//".into()), ); return ptr::null_mut(); } } } // OPTIONS (CORS) if method == HttpMethod::Options { (*dreq).method = DaemonMethod::Health; return dreq; } libc::free(dreq as *mut c_void); let method_str = match method { HttpMethod::Get => "GET", HttpMethod::Post => "POST", HttpMethod::Delete => "DELETE", HttpMethod::Options => "OPTIONS", }; set_errmsg( errmsg, &MorlocError::Other(format!("Unknown router endpoint: {} {}", method_str, path)), ); ptr::null_mut() } // -- Router event loop -------------------------------------------------------- const ROUTER_MAX_LISTENERS: usize = 3; #[no_mangle] pub unsafe extern "C" fn router_run(config: *mut DaemonConfig, router: *mut Router) { extern "C" { fn http_parse_request(fd: i32, errmsg: *mut *mut c_char) -> *mut HttpRequest; fn http_free_request(req: *mut HttpRequest); fn http_write_response( fd: i32, status: i32, 
content_type: *const c_char,
            body: *const c_char,
            body_len: usize,
        ) -> bool;
        fn daemon_dispatch(
            manifest: *mut c_void,
            request: *mut DaemonRequest,
            sockets: *mut MorlocSocket,
            shm_basename: *const c_char,
        ) -> *mut DaemonResponse;
        fn daemon_serialize_response(
            response: *mut DaemonResponse,
            out_len: *mut usize,
        ) -> *mut c_char;
        fn daemon_free_request(req: *mut DaemonRequest);
        fn daemon_free_response(resp: *mut DaemonResponse);
        fn daemon_set_eval_timeout(timeout_sec: i32);
        fn manifest_to_discovery_json(manifest: *const c_void) -> *mut c_char;
    }
    daemon_set_eval_timeout((*config).eval_timeout);
    // Install signal handlers
    ROUTER_SHUTDOWN_REQUESTED.store(false, Ordering::Relaxed);
    // NOTE(review): the transmute turbofish parameters were lost in
    // extraction; the source type assumes router_signal_handler_fn is an
    // `extern "C" fn(i32)` -- confirm against its definition.
    let handler: libc::sighandler_t =
        std::mem::transmute::<extern "C" fn(i32), libc::sighandler_t>(router_signal_handler_fn);
    libc::signal(libc::SIGTERM, handler);
    libc::signal(libc::SIGINT, handler);
    let mut fds = [libc::pollfd {
        fd: -1,
        events: 0,
        revents: 0,
    }; ROUTER_MAX_LISTENERS];
    let mut nfds: usize = 0;
    // Content-Type shared by every response we write.
    let ct = b"application/json\0";
    // HTTP listener
    if (*config).http_port > 0 {
        let http_fd = libc::socket(libc::AF_INET, libc::SOCK_STREAM, 0);
        if http_fd < 0 {
            eprintln!("router: failed to create http socket");
            return;
        }
        let opt: i32 = 1;
        libc::setsockopt(
            http_fd,
            libc::SOL_SOCKET,
            libc::SO_REUSEADDR,
            &opt as *const i32 as *const c_void,
            std::mem::size_of::<i32>() as libc::socklen_t,
        );
        let mut addr: libc::sockaddr_in = std::mem::zeroed();
        addr.sin_family = libc::AF_INET as libc::sa_family_t;
        addr.sin_addr.s_addr = libc::INADDR_ANY;
        addr.sin_port = ((*config).http_port as u16).to_be();
        if libc::bind(
            http_fd,
            &addr as *const libc::sockaddr_in as *const libc::sockaddr,
            std::mem::size_of::<libc::sockaddr_in>() as libc::socklen_t,
        ) < 0
        {
            eprintln!(
                "router: failed to bind http port {}",
                (*config).http_port
            );
            libc::close(http_fd);
            return;
        }
        libc::listen(http_fd, 16);
        eprintln!("router: listening on http port {}", (*config).http_port);
        fds[nfds].fd = http_fd;
        fds[nfds].events = libc::POLLIN as i16;
        nfds += 1;
    }
    // Unix socket
    if !(*config).unix_socket_path.is_null() {
        let sock_fd = libc::socket(libc::AF_UNIX, libc::SOCK_STREAM, 0);
        if sock_fd < 0 {
            eprintln!("router: failed to create unix socket");
            return;
        }
        let mut addr: libc::sockaddr_un = std::mem::zeroed();
        addr.sun_family = libc::AF_UNIX as libc::sa_family_t;
        let path_bytes = CStr::from_ptr((*config).unix_socket_path).to_bytes();
        let copy_len = path_bytes.len().min(addr.sun_path.len() - 1);
        ptr::copy_nonoverlapping(
            path_bytes.as_ptr() as *const c_char,
            addr.sun_path.as_mut_ptr(),
            copy_len,
        );
        // Remove any stale socket file left by a previous run.
        libc::unlink((*config).unix_socket_path);
        if libc::bind(
            sock_fd,
            &addr as *const libc::sockaddr_un as *const libc::sockaddr,
            std::mem::size_of::<libc::sockaddr_un>() as libc::socklen_t,
        ) < 0
        {
            eprintln!("router: failed to bind unix socket");
            libc::close(sock_fd);
            return;
        }
        libc::listen(sock_fd, 16);
        eprintln!(
            "router: listening on unix socket {}",
            CStr::from_ptr((*config).unix_socket_path).to_string_lossy()
        );
        fds[nfds].fd = sock_fd;
        fds[nfds].events = libc::POLLIN as i16;
        nfds += 1;
    }
    if nfds == 0 {
        eprintln!("router: no listeners configured");
        return;
    }
    // Eagerly start all program daemons so /health reports ok immediately
    for i in 0..(*router).n_programs {
        let prog = &mut *(*router).programs.add(i);
        if (*prog).daemon_pid <= 0 {
            let mut child_err: *mut c_char = ptr::null_mut();
            if router_start_program(prog, &mut child_err) {
                eprintln!(
                    "router: started daemon for '{}'",
                    CStr::from_ptr((*prog).name).to_string_lossy()
                );
            } else {
                let err_msg = if !child_err.is_null() {
                    let s = CStr::from_ptr(child_err).to_string_lossy().to_string();
                    libc::free(child_err as *mut c_void);
                    s
                } else {
                    "unknown error".to_string()
                };
                eprintln!(
                    "router: warning: failed to start daemon for '{}': {}",
                    CStr::from_ptr((*prog).name).to_string_lossy(),
                    err_msg
                );
            }
        }
    }
    while !ROUTER_SHUTDOWN_REQUESTED.load(Ordering::Relaxed) {
        // 1s poll timeout so the shutdown flag is re-checked regularly.
        let ready = libc::poll(fds.as_mut_ptr(), nfds as libc::nfds_t, 1000);
        if ready < 0 {
            if crate::utility::errno_val() == libc::EINTR {
                continue;
            }
            eprintln!("router: poll error");
            break;
        }
        if ready == 0 {
            continue;
        }
        for i in 0..nfds {
            if fds[i].revents & libc::POLLIN as i16 == 0 {
                continue;
            }
            let client_fd = libc::accept(fds[i].fd, ptr::null_mut(), ptr::null_mut());
            if client_fd < 0 {
                continue;
            }
            let req_start = Instant::now();
            crate::utility::set_nosigpipe(client_fd);
            let tv = libc::timeval {
                tv_sec: 30,
                tv_usec: 0,
            };
            libc::setsockopt(
                client_fd,
                libc::SOL_SOCKET,
                libc::SO_RCVTIMEO,
                &tv as *const libc::timeval as *const c_void,
                std::mem::size_of::<libc::timeval>() as libc::socklen_t,
            );
            libc::setsockopt(
                client_fd,
                libc::SOL_SOCKET,
                libc::SO_SNDTIMEO,
                &tv as *const libc::timeval as *const c_void,
                std::mem::size_of::<libc::timeval>() as libc::socklen_t,
            );
            let mut err: *mut c_char = ptr::null_mut();
            let http_req = http_parse_request(client_fd, &mut err);
            if !err.is_null() {
                let body = b"{\"status\":\"error\",\"error\":\"Bad request\"}\0";
                http_write_response(
                    client_fd,
                    400,
                    ct.as_ptr() as *const c_char,
                    body.as_ptr() as *const c_char,
                    body.len() - 1,
                );
                libc::free(err as *mut c_void);
                let elapsed = req_start.elapsed();
                eprintln!("router: ??? ??? -> 400 ({:.1}ms)", elapsed.as_secs_f64() * 1000.0);
                libc::close(client_fd);
                continue;
            }
            // Extract method and path for access logging before request is consumed
            let log_method = match (*http_req).method {
                HttpMethod::Get => "GET",
                HttpMethod::Post => "POST",
                HttpMethod::Delete => "DELETE",
                HttpMethod::Options => "OPTIONS",
            };
            let log_path_cstr = CStr::from_ptr((*http_req).path.as_ptr());
            let log_path = log_path_cstr.to_str().unwrap_or("???").to_string();
            let mut target_program: *mut c_char = ptr::null_mut();
            let dreq = router_http_to_request(http_req, &mut target_program, &mut err);
            http_free_request(http_req);
            if !err.is_null() {
                let err_json = make_error_json(&CStr::from_ptr(err).to_string_lossy());
                let c = CString::new(err_json.as_str()).unwrap_or_default();
                http_write_response(
                    client_fd,
                    404,
                    ct.as_ptr() as *const c_char,
                    c.as_ptr(),
                    err_json.len(),
                );
                libc::free(err as *mut c_void);
                let elapsed = req_start.elapsed();
                eprintln!("router: {} {} -> 404 ({:.1}ms)", log_method, log_path, elapsed.as_secs_f64() * 1000.0);
                libc::close(client_fd);
                continue;
            }
            // Track response status for access log
            let mut resp_status: i32 = 200;
            // Router-level requests
            if target_program.is_null() {
                if (*dreq).method == DaemonMethod::Health {
                    // Aggregate per-program health
                    let mut all_ok = true;
                    let mut prog_entries = Vec::new();
                    for i in 0..(*router).n_programs {
                        let prog = &*(*router).programs.add(i);
                        let name = CStr::from_ptr(prog.name).to_string_lossy();
                        let alive = prog.daemon_pid > 0 && libc::kill(prog.daemon_pid, 0) == 0;
                        if !alive {
                            all_ok = false;
                        }
                        let status_str = if alive { "ok" } else { "error" };
                        prog_entries.push(serde_json::json!({
                            "program": name.as_ref(),
                            "status": status_str,
                        }));
                    }
                    let overall = if all_ok { "ok" } else { "degraded" };
                    let body = serde_json::json!({
                        "status": overall,
                        "programs": prog_entries,
                    }).to_string();
                    let status_code = if all_ok { 200 } else { 503 };
                    resp_status = status_code;
                    let c = CString::new(body.as_str()).unwrap_or_default();
http_write_response(
                        client_fd,
                        status_code,
                        ct.as_ptr() as *const c_char,
                        c.as_ptr(),
                        body.len(),
                    );
                } else if (*dreq).method == DaemonMethod::Discover {
                    // Router-level discovery: aggregate JSON over all programs.
                    let disco = router_build_discovery(router);
                    let disco_len = libc::strlen(disco);
                    http_write_response(
                        client_fd,
                        200,
                        ct.as_ptr() as *const c_char,
                        disco,
                        disco_len,
                    );
                    libc::free(disco as *mut c_void);
                } else if (*dreq).method == DaemonMethod::Eval {
                    // daemon_dispatch takes manifest as first arg, NULL is fine for eval
                    let resp = daemon_dispatch(ptr::null_mut(), dreq, ptr::null_mut(), ptr::null());
                    let mut resp_len: usize = 0;
                    let resp_json = daemon_serialize_response(resp, &mut resp_len);
                    let status = if (*resp).success { 200 } else { 500 };
                    resp_status = status;
                    http_write_response(
                        client_fd,
                        status,
                        ct.as_ptr() as *const c_char,
                        resp_json,
                        resp_len,
                    );
                    libc::free(resp_json as *mut c_void);
                    daemon_free_response(resp);
                }
                daemon_free_request(dreq);
                // Access log: "METHOD PATH -> STATUS (elapsed)".
                let elapsed = req_start.elapsed();
                eprintln!("router: {} {} -> {} ({:.1}ms)", log_method, log_path, resp_status, elapsed.as_secs_f64() * 1000.0);
                libc::close(client_fd);
                continue;
            }
            // Per-program request
            if (*dreq).method == DaemonMethod::Health {
                let mut found = false;
                for p in 0..(*router).n_programs {
                    let rprog = &*(*router).programs.add(p);
                    if CStr::from_ptr(rprog.name) == CStr::from_ptr(target_program) {
                        found = true;
                        // Liveness probe: signal 0 checks the pid without signaling.
                        let alive = rprog.daemon_pid > 0 && libc::kill(rprog.daemon_pid, 0) == 0;
                        let prog_str = CStr::from_ptr(rprog.name).to_string_lossy();
                        let body = if alive {
                            serde_json::json!({
                                "status": "ok",
                                "program": prog_str.as_ref(),
                            }).to_string()
                        } else {
                            resp_status = 503;
                            serde_json::json!({
                                "status": "error",
                                "program": prog_str.as_ref(),
                                "error": "daemon not running",
                            }).to_string()
                        };
                        let c = CString::new(body.as_str()).unwrap_or_default();
                        http_write_response(
                            client_fd,
                            resp_status,
                            ct.as_ptr() as *const c_char,
                            c.as_ptr(),
                            body.len(),
                        );
                        break;
                    }
                }
                if !found {
                    resp_status = 404;
                    // len - 1 below drops the trailing NUL from the byte literal.
                    let body = b"{\"status\":\"error\",\"error\":\"Unknown program\"}\0";
                    http_write_response(
                        client_fd,
                        404,
                        ct.as_ptr() as *const c_char,
                        body.as_ptr() as *const c_char,
                        body.len() - 1,
                    );
                }
            } else if (*dreq).method == DaemonMethod::Discover {
                let mut found = false;
                for p in 0..(*router).n_programs {
                    let rprog = &*(*router).programs.add(p);
                    if CStr::from_ptr(rprog.name) == CStr::from_ptr(target_program) {
                        // Only programs with a loaded manifest can answer; a
                        // matching program without one falls through to 404.
                        if !rprog.manifest.is_null() {
                            let disco = manifest_to_discovery_json(rprog.manifest);
                            let disco_len = libc::strlen(disco);
                            http_write_response(
                                client_fd,
                                200,
                                ct.as_ptr() as *const c_char,
                                disco,
                                disco_len,
                            );
                            libc::free(disco as *mut c_void);
                            found = true;
                        }
                        break;
                    }
                }
                if !found {
                    resp_status = 404;
                    let body = b"{\"status\":\"error\",\"error\":\"Unknown program\"}\0";
                    http_write_response(
                        client_fd,
                        404,
                        ct.as_ptr() as *const c_char,
                        body.as_ptr() as *const c_char,
                        body.len() - 1,
                    );
                }
            } else {
                // Forward to program daemon
                let resp = router_forward(router, target_program, dreq, &mut err);
                if !err.is_null() {
                    resp_status = 500;
                    let err_json = make_error_json(&CStr::from_ptr(err).to_string_lossy());
                    let c = CString::new(err_json.as_str()).unwrap_or_default();
                    http_write_response(
                        client_fd,
                        500,
                        ct.as_ptr() as *const c_char,
                        c.as_ptr(),
                        err_json.len(),
                    );
                    libc::free(err as *mut c_void);
                } else {
                    let mut resp_len: usize = 0;
                    let resp_json = daemon_serialize_response(resp, &mut resp_len);
                    let status = if (*resp).success { 200 } else { 500 };
                    resp_status = status;
                    http_write_response(
                        client_fd,
                        status,
                        ct.as_ptr() as *const c_char,
                        resp_json,
                        resp_len,
                    );
                    libc::free(resp_json as *mut c_void);
                    daemon_free_response(resp);
                }
            }
            libc::free(target_program as *mut c_void);
            daemon_free_request(dreq);
            let elapsed = req_start.elapsed();
            eprintln!("router: {} {} -> {} ({:.1}ms)", log_method, log_path, resp_status, elapsed.as_secs_f64() * 1000.0);
            libc::close(client_fd);
        }
    }
    // Kill all program daemons
    for i in 0..(*router).n_programs {
        let prog = &*(*router).programs.add(i);
        if prog.daemon_pid > 0 {
            libc::kill(prog.daemon_pid, libc::SIGTERM);
libc::unlink(prog.daemon_socket.as_ptr());
        }
    }
    // Wait for children
    for i in 0..(*router).n_programs {
        let prog = &*(*router).programs.add(i);
        if prog.daemon_pid > 0 {
            libc::waitpid(prog.daemon_pid, ptr::null_mut(), 0);
        }
    }
    // Close listeners
    for i in 0..nfds {
        libc::close(fds[i].fd);
    }
    if !(*config).unix_socket_path.is_null() {
        libc::unlink((*config).unix_socket_path);
    }
}

/// Build a JSON error response string.
fn make_error_json(error: &str) -> String {
    // NOTE(review): the Map type parameters were lost in extraction;
    // serde_json::Map is always keyed String -> Value.
    let map: serde_json::Map<String, serde_json::Value> = [
        ("status".into(), serde_json::Value::String("error".into())),
        ("error".into(), serde_json::Value::String(error.into())),
    ]
    .into_iter()
    .collect();
    serde_json::to_string(&map).unwrap_or_else(|_| "{}".into())
}



================================================
FILE: data/rust/morloc-runtime/src/schema.rs
================================================

use crate::error::MorlocError;

/// Morloc serial type identifiers, matching the C enum morloc_serial_type.
#[derive(Debug, Clone, Copy, PartialEq, Eq)]
#[repr(u32)]
pub enum SerialType {
    Nil = 0,
    Bool = 1,
    Sint8 = 2,
    Sint16 = 3,
    Sint32 = 4,
    Sint64 = 5,
    Uint8 = 6,
    Uint16 = 7,
    Uint32 = 8,
    Uint64 = 9,
    Float32 = 10,
    Float64 = 11,
    Tensor = 12,
    String = 13,
    Array = 14,
    Tuple = 15,
    Map = 16,
    Optional = 17,
}

/// Schema character codes for parsing schema strings.
const SCHEMA_NIL: u8 = b'z';
const SCHEMA_BOOL: u8 = b'b';
const SCHEMA_SINT: u8 = b'i';
const SCHEMA_UINT: u8 = b'u';
const SCHEMA_FLOAT: u8 = b'f';
const SCHEMA_STRING: u8 = b's';
const SCHEMA_ARRAY: u8 = b'a';
const SCHEMA_TENSOR: u8 = b'T';
const SCHEMA_TUPLE: u8 = b't';
const SCHEMA_MAP: u8 = b'm';
const SCHEMA_OPTIONAL: u8 = b'?';

/// Recursive schema definition, mirroring the C Schema struct.
#[derive(Debug, Clone)]
pub struct Schema {
    pub serial_type: SerialType,
    /// Number of parameters (e.g., array has 1, tuple has N).
    pub size: usize,
    /// Byte width when stored in a fixed-width array.
    pub width: usize,
    /// Field offsets for tuples/records, or ndim storage for tensors.
    pub offsets: Vec<usize>,
    /// Optional type hint string.
    pub hint: Option<String>,
    /// Child schemas (element type for arrays, field types for tuples, etc.).
    pub parameters: Vec<Schema>,
    /// Field names for records (None for non-record types).
    pub keys: Vec<String>,
}

impl Schema {
    pub fn primitive(serial_type: SerialType) -> Self {
        use crate::shm;
        let width = match serial_type {
            SerialType::Nil => 0,
            SerialType::Bool | SerialType::Sint8 | SerialType::Uint8 => 1,
            SerialType::Sint16 | SerialType::Uint16 => 2,
            SerialType::Sint32 | SerialType::Uint32 | SerialType::Float32 => 4,
            SerialType::Sint64 | SerialType::Uint64 | SerialType::Float64 => 8,
            // NOTE(review): the size_of turbofish parameter was lost in
            // extraction; `usize` matches the pointer-sized slot width used by
            // the other variable-length constructors -- confirm against the C
            // Schema (the `use crate::shm;` above hints at a shm type here).
            SerialType::String => std::mem::size_of::<usize>(),
            _ => 0,
        };
        Schema {
            serial_type,
            size: 0,
            width,
            offsets: Vec::new(),
            hint: None,
            parameters: Vec::new(),
            keys: Vec::new(),
        }
    }
    /// Returns true if this type has a fixed byte width (no variable-length data).
    pub fn is_fixed_width(&self) -> bool {
        match self.serial_type {
            SerialType::Nil
            | SerialType::Bool
            | SerialType::Sint8
            | SerialType::Sint16
            | SerialType::Sint32
            | SerialType::Sint64
            | SerialType::Uint8
            | SerialType::Uint16
            | SerialType::Uint32
            | SerialType::Uint64
            | SerialType::Float32
            | SerialType::Float64 => true,
            // A tuple is fixed-width iff every field is.
            SerialType::Tuple => self.parameters.iter().all(|p| p.is_fixed_width()),
            SerialType::Optional => false,
            _ => false,
        }
    }
    /// Alignment requirement for this type.
pub fn alignment(&self) -> usize { match self.serial_type { SerialType::Nil => 1, SerialType::Bool | SerialType::Sint8 | SerialType::Uint8 => 1, SerialType::Sint16 | SerialType::Uint16 => 2, SerialType::Sint32 | SerialType::Uint32 | SerialType::Float32 => 4, SerialType::Sint64 | SerialType::Uint64 | SerialType::Float64 => 8, SerialType::String | SerialType::Array | SerialType::Map | SerialType::Tensor => { std::mem::size_of::() // pointer-sized alignment } SerialType::Tuple => { self.parameters .iter() .map(|p| p.alignment()) .max() .unwrap_or(1) } SerialType::Optional => { if let Some(inner) = self.parameters.first() { std::cmp::max(1, inner.alignment()) } else { 1 } } } } } /// Parse a schema string into a Schema tree. /// /// Positional format (no parentheses/commas): /// - `z` -> Nil, `b` -> Bool, `s` -> String /// - `i4` -> Sint32, `u8` -> Uint64, `f8` -> Float64 /// - `ai4` -> Array of Sint32 /// - `t2i4s` -> Tuple of (Sint32, String) /// - `m24namesi4` -> Map with keys "name"->String, "i4" (base-62 field count, then key-len + key + value for each) /// - `?i4` -> Optional Sint32 /// - `T2f8` -> 2D Tensor of Float64 /// - `i4` -> Sint32 with hint annotation pub fn parse_schema(input: &str) -> Result { let bytes = input.as_bytes(); let (schema, consumed) = parse_schema_r(bytes, 0)?; if consumed != bytes.len() { return Err(MorlocError::Schema(format!( "trailing characters after schema at position {consumed}" ))); } Ok(schema) } /// Recursive schema parser matching the C `parse_schema_r` format exactly. 
fn parse_schema_r(bytes: &[u8], pos: usize) -> Result<(Schema, usize), MorlocError> { if pos >= bytes.len() { return Err(MorlocError::Schema("unexpected end of schema".into())); } let c = bytes[pos]; let cur = pos + 1; match c { b'<' => { // Hint: <...> with nesting support, then parse the actual type let (hint, after_hint) = parse_hint(bytes, cur)?; let (mut schema, end) = parse_schema_r(bytes, after_hint)?; schema.hint = Some(hint); Ok((schema, end)) } SCHEMA_NIL => Ok((Schema::primitive(SerialType::Nil), cur)), SCHEMA_BOOL => Ok((Schema::primitive(SerialType::Bool), cur)), SCHEMA_STRING => { // String schema has one parameter (uint8) for array compatibility, // matching the C string_schema() constructor. Ok((Schema { serial_type: SerialType::String, size: 1, width: std::mem::size_of::(), offsets: Vec::new(), hint: None, parameters: vec![Schema::primitive(SerialType::Uint8)], keys: Vec::new(), }, cur)) } SCHEMA_SINT => parse_sized_int(bytes, cur, true), SCHEMA_UINT => parse_sized_int(bytes, cur, false), SCHEMA_FLOAT => parse_sized_float(bytes, cur), SCHEMA_ARRAY => { // Array: one child schema follows immediately let (child, end) = parse_schema_r(bytes, cur)?; Ok((make_array_schema(child), end)) } SCHEMA_OPTIONAL => { // Optional: one child schema follows immediately let (child, end) = parse_schema_r(bytes, cur)?; Ok((make_optional_schema(child), end)) } SCHEMA_TUPLE => { // Tuple: base-62 size char, then N child schemas if cur >= bytes.len() { return Err(MorlocError::Schema("expected tuple size".into())); } let n = decode_base62(bytes[cur])?; let mut params = Vec::with_capacity(n); let mut p = cur + 1; for _ in 0..n { let (child, end) = parse_schema_r(bytes, p)?; params.push(child); p = end; } Ok((make_tuple_schema(params), p)) } SCHEMA_MAP => { // Map/record: base-62 size char, then N (key_len_char + key_bytes + value_schema) if cur >= bytes.len() { return Err(MorlocError::Schema("expected map size".into())); } let n = decode_base62(bytes[cur])?; let mut params 
= Vec::with_capacity(n); let mut keys = Vec::with_capacity(n); let mut p = cur + 1; for _ in 0..n { // Read key: base-62 length char + that many bytes if p >= bytes.len() { return Err(MorlocError::Schema("expected map key length".into())); } let key_len = decode_base62(bytes[p])?; p += 1; if p + key_len > bytes.len() { return Err(MorlocError::Schema("map key extends past end".into())); } let key = std::str::from_utf8(&bytes[p..p + key_len]) .map_err(|_| MorlocError::Schema("invalid UTF-8 in map key".into()))? .to_string(); p += key_len; keys.push(key); // Read value schema let (child, end) = parse_schema_r(bytes, p)?; params.push(child); p = end; } Ok((make_map_schema(params, keys), p)) } SCHEMA_TENSOR => { // Tensor: base-62 ndim char, then element schema if cur >= bytes.len() { return Err(MorlocError::Schema("expected tensor ndim".into())); } let ndim = decode_base62(bytes[cur])?; let (child, end) = parse_schema_r(bytes, cur + 1)?; Ok((make_tensor_schema(ndim, child), end)) } _ => Err(MorlocError::Schema(format!( "unknown schema character '{}' at position {pos}", c as char ))), } } /// Parse hint with nested angle bracket support: `>` etc. 
fn parse_hint(bytes: &[u8], pos: usize) -> Result<(String, usize), MorlocError> { let mut depth: usize = 1; let start = pos; let mut cur = pos; while cur < bytes.len() { match bytes[cur] { b'<' => depth += 1, b'>' => { depth -= 1; if depth == 0 { let hint = std::str::from_utf8(&bytes[start..cur]) .unwrap_or("") .to_string(); return Ok((hint, cur + 1)); // skip closing '>' } } _ => {} } cur += 1; } Err(MorlocError::Schema("unclosed '<' in hint".into())) } fn parse_sized_int( bytes: &[u8], pos: usize, signed: bool, ) -> Result<(Schema, usize), MorlocError> { if pos >= bytes.len() { return Err(MorlocError::Schema("expected size after 'i'/'u'".into())); } // Size is a SINGLE base-62 character, not a multi-digit number let size = decode_base62(bytes[pos])?; let next = pos + 1; let st = match (signed, size) { (true, 1) => SerialType::Sint8, (true, 2) => SerialType::Sint16, (true, 4) => SerialType::Sint32, (true, 8) => SerialType::Sint64, (false, 1) => SerialType::Uint8, (false, 2) => SerialType::Uint16, (false, 4) => SerialType::Uint32, (false, 8) => SerialType::Uint64, _ => return Err(MorlocError::Schema(format!("invalid integer size {size}"))), }; Ok((Schema::primitive(st), next)) } fn parse_sized_float(bytes: &[u8], pos: usize) -> Result<(Schema, usize), MorlocError> { if pos >= bytes.len() { return Err(MorlocError::Schema("expected size after 'f'".into())); } // Size is a SINGLE base-62 character, not a multi-digit number let size = decode_base62(bytes[pos])?; let next = pos + 1; let st = match size { 4 => SerialType::Float32, 8 => SerialType::Float64, _ => return Err(MorlocError::Schema(format!("invalid float size {size}"))), }; Ok((Schema::primitive(st), next)) } /// Decode a single base-62 character to a number (0-63). 
/// 0-9 -> 0-9, a-z -> 10-35, A-Z -> 36-61, + -> 62, / -> 63
fn decode_base62(c: u8) -> Result<usize, MorlocError> {
    match c {
        b'0'..=b'9' => Ok((c - b'0') as usize),
        b'a'..=b'z' => Ok((c - b'a') as usize + 10),
        b'A'..=b'Z' => Ok((c - b'A') as usize + 36),
        b'+' => Ok(62),
        b'/' => Ok(63),
        _ => Err(MorlocError::Schema(format!(
            "invalid base-62 size character '{}'",
            c as char
        ))),
    }
}

/// Inverse of `decode_base62`; out-of-range values map to '\x07'.
fn encode_base62(n: usize) -> char {
    match n {
        0..=9 => (b'0' + n as u8) as char,
        10..=35 => (b'a' + (n - 10) as u8) as char,
        36..=61 => (b'A' + (n - 36) as u8) as char,
        62 => '+',
        63 => '/',
        _ => '\x07', // bell - error
    }
}

// ── Schema constructors ────────────────────────────────────────────────────

fn make_array_schema(child: Schema) -> Schema {
    Schema {
        serial_type: SerialType::Array,
        size: 1,
        // NOTE(review): the size_of turbofish parameter was lost in
        // extraction; `usize` gives the pointer-sized slot width used for
        // variable-length values -- confirm against the C Schema.
        width: std::mem::size_of::<usize>(),
        offsets: Vec::new(),
        hint: None,
        parameters: vec![child],
        keys: Vec::new(),
    }
}

fn make_optional_schema(child: Schema) -> Schema {
    // Layout: 1-byte presence flag, then the payload aligned to its natural
    // alignment; offsets[0] records where the payload starts.
    let align = child.alignment().max(1);
    let inner_offset = crate::shm::align_up(1, align);
    Schema {
        serial_type: SerialType::Optional,
        size: 1,
        width: inner_offset + child.width,
        offsets: vec![inner_offset],
        hint: None,
        parameters: vec![child],
        keys: Vec::new(),
    }
}

fn make_tuple_schema(params: Vec<Schema>) -> Schema {
    let (width, offsets) = calculate_tuple_layout(&params);
    let size = params.len();
    Schema {
        serial_type: SerialType::Tuple,
        size,
        width,
        offsets,
        hint: None,
        parameters: params,
        keys: Vec::new(),
    }
}

fn make_map_schema(params: Vec<Schema>, keys: Vec<String>) -> Schema {
    // Records share the tuple layout; keys carry the field names.
    let (width, offsets) = calculate_tuple_layout(&params);
    let size = params.len();
    Schema {
        serial_type: SerialType::Map,
        size,
        width,
        offsets,
        hint: None,
        parameters: params,
        keys,
    }
}

fn make_tensor_schema(ndim: usize, child: Schema) -> Schema {
    Schema {
        serial_type: SerialType::Tensor,
        size: 1,
        width: std::mem::size_of::<usize>(),
        // ndim is stashed in offsets[0] (read back by schema_to_string_inner).
        offsets: vec![ndim],
        hint: None,
        parameters: vec![child],
        keys: Vec::new(),
    }
}

/// Calculate byte offsets for tuple fields (C struct layout with natural alignment).
fn calculate_tuple_layout(params: &[Schema]) -> (usize, Vec) { let mut offsets = Vec::with_capacity(params.len()); let mut offset: usize = 0; let mut max_align: usize = 1; for param in params { let align = param.alignment(); max_align = std::cmp::max(max_align, align); // Align the offset offset = (offset + align - 1) & !(align - 1); offsets.push(offset); offset += param.width; } // Total width padded to max alignment let width = (offset + max_align - 1) & !(max_align - 1); (width, offsets) } /// Render a schema back to its string representation. pub fn schema_to_string(schema: &Schema) -> String { let mut buf = String::new(); schema_to_string_inner(schema, &mut buf); buf } fn schema_to_string_inner(schema: &Schema, buf: &mut String) { // Write hint if present if let Some(ref hint) = schema.hint { buf.push('<'); buf.push_str(hint); buf.push('>'); } match schema.serial_type { SerialType::Nil => buf.push('z'), SerialType::Bool => buf.push('b'), SerialType::Sint8 => buf.push_str("i1"), SerialType::Sint16 => buf.push_str("i2"), SerialType::Sint32 => buf.push_str("i4"), SerialType::Sint64 => buf.push_str("i8"), SerialType::Uint8 => buf.push_str("u1"), SerialType::Uint16 => buf.push_str("u2"), SerialType::Uint32 => buf.push_str("u4"), SerialType::Uint64 => buf.push_str("u8"), SerialType::Float32 => buf.push_str("f4"), SerialType::Float64 => buf.push_str("f8"), SerialType::String => buf.push('s'), SerialType::Array => { buf.push('a'); schema_to_string_inner(&schema.parameters[0], buf); } SerialType::Tuple => { buf.push('t'); buf.push(encode_base62(schema.size)); for p in &schema.parameters { schema_to_string_inner(p, buf); } } SerialType::Map => { buf.push('m'); buf.push(encode_base62(schema.size)); for (i, p) in schema.parameters.iter().enumerate() { if i < schema.keys.len() { let key = &schema.keys[i]; buf.push(encode_base62(key.len())); buf.push_str(key); } schema_to_string_inner(p, buf); } } SerialType::Optional => { buf.push('?'); 
schema_to_string_inner(&schema.parameters[0], buf); } SerialType::Tensor => { let ndim = schema.offsets.first().copied().unwrap_or(0); buf.push('T'); buf.push(encode_base62(ndim)); schema_to_string_inner(&schema.parameters[0], buf); } } } #[cfg(test)] mod tests { use super::*; #[test] fn test_parse_primitives() { assert_eq!(parse_schema("z").unwrap().serial_type, SerialType::Nil); assert_eq!(parse_schema("b").unwrap().serial_type, SerialType::Bool); assert_eq!(parse_schema("i4").unwrap().serial_type, SerialType::Sint32); assert_eq!(parse_schema("u8").unwrap().serial_type, SerialType::Uint64); assert_eq!(parse_schema("f8").unwrap().serial_type, SerialType::Float64); assert_eq!(parse_schema("s").unwrap().serial_type, SerialType::String); } #[test] fn test_parse_array() { let s = parse_schema("ai4").unwrap(); assert_eq!(s.serial_type, SerialType::Array); assert_eq!(s.parameters.len(), 1); assert_eq!(s.parameters[0].serial_type, SerialType::Sint32); } #[test] fn test_parse_tuple() { let s = parse_schema("t3i4sf8").unwrap(); assert_eq!(s.serial_type, SerialType::Tuple); assert_eq!(s.parameters.len(), 3); } #[test] fn test_parse_nested() { let s = parse_schema("at2i4s").unwrap(); assert_eq!(s.serial_type, SerialType::Array); assert_eq!(s.parameters[0].serial_type, SerialType::Tuple); assert_eq!(s.parameters[0].parameters.len(), 2); } #[test] fn test_parse_map() { let s = parse_schema("m21as1bi4").unwrap(); assert_eq!(s.serial_type, SerialType::Map); assert_eq!(s.parameters.len(), 2); assert_eq!(s.keys[0], "a"); assert_eq!(s.keys[1], "b"); } #[test] fn test_parse_optional() { let s = parse_schema("?f8").unwrap(); assert_eq!(s.serial_type, SerialType::Optional); assert_eq!(s.parameters[0].serial_type, SerialType::Float64); } #[test] fn test_parse_tensor() { let s = parse_schema("T2f8").unwrap(); assert_eq!(s.serial_type, SerialType::Tensor); assert_eq!(s.offsets[0], 2); // ndim assert_eq!(s.parameters[0].serial_type, SerialType::Float64); } #[test] fn 
test_parse_with_hints() { let s = parse_schema("f8").unwrap(); assert_eq!(s.serial_type, SerialType::Float64); assert_eq!(s.hint.as_deref(), Some("float")); // Nested hints: > let s = parse_schema(">ai4").unwrap(); assert_eq!(s.serial_type, SerialType::Array); assert_eq!(s.hint.as_deref(), Some("std::vector<$1>")); } #[test] fn test_roundtrip() { let cases = ["z", "b", "i4", "u8", "f8", "s", "ai4", "t2i4s", "?i4", "T2f8"]; for case in cases { let schema = parse_schema(case).unwrap(); let rendered = schema_to_string(&schema); assert_eq!(rendered, case, "roundtrip failed for '{case}'"); } } #[test] fn test_roundtrip_map() { let input = "m24names4infoi4"; let schema = parse_schema(input).unwrap(); assert_eq!(schema.serial_type, SerialType::Map); assert_eq!(schema.keys, vec!["name", "info"]); let rendered = schema_to_string(&schema); assert_eq!(rendered, input); } } #[cfg(test)] mod compat_tests { use super::*; fn dump(label: &str, s: &Schema, depth: usize) { let indent = " ".repeat(depth); print!("{}{}: type={} size={} width={}", indent, label, s.serial_type as u32, s.size, s.width); if !s.offsets.is_empty() { print!(" offsets={:?}", s.offsets); } if let Some(ref h) = s.hint { print!(" hint=\"{}\"", h); } if !s.keys.is_empty() { print!(" keys={:?}", s.keys); } println!(); for (i, p) in s.parameters.iter().enumerate() { dump(&format!("param[{}]", i), p, depth + 1); } } #[test] fn test_schema_compat_with_c() { // These must match the C output exactly let cases = vec![ ("s", "type=13 size=1 width=16"), ("ai4", "type=14 size=1 width=16"), ("t2i4s", "type=15 size=2 width=24"), ("?i4", "type=17 size=1 width=8"), ("?s", "type=17 size=1 width=24"), ("T2f8", "type=12 size=1 width=32"), ]; for (input, expected_root) in &cases { let s = parse_schema(input).unwrap(); let got = format!("type={} size={} width={}", s.serial_type as u32, s.size, s.width); assert_eq!(&got, *expected_root, "Schema '{}' mismatch", input); } // Verify tuple offsets let t = parse_schema("t2i4s").unwrap(); 
assert_eq!(t.offsets, vec![0, 8], "t2i4s offsets"); // Verify optional offsets let o = parse_schema("?i4").unwrap(); assert_eq!(o.offsets, vec![4], "?i4 offsets"); let os = parse_schema("?s").unwrap(); assert_eq!(os.offsets, vec![8], "?s offsets"); // Verify string has uint8 parameter let s = parse_schema("s").unwrap(); assert_eq!(s.parameters.len(), 1); assert_eq!(s.parameters[0].serial_type, SerialType::Uint8); assert_eq!(s.parameters[0].width, 1); // Verify tensor let t = parse_schema("T2f8").unwrap(); assert_eq!(t.offsets, vec![2]); // ndim assert_eq!(t.width, 32); // sizeof(Tensor) } } ================================================ FILE: data/rust/morloc-runtime/src/shm.rs ================================================ //! Shared memory management with multi-volume support. //! //! Replaces shm.c / memory.h. Uses AtomicU32 + futex for cross-process locking //! instead of pthread_rwlock_t, providing crash-safety and portability. use crate::error::MorlocError; use std::sync::atomic::{AtomicU32, Ordering}; use std::sync::Mutex; /// Cross-platform file pre-allocation. /// Linux: posix_fallocate (allocates disk blocks). /// macOS: ftruncate (extends file, may be sparse). 
#[cfg(target_os = "linux")]
unsafe fn preallocate_fd(fd: i32, size: i64) -> i32 {
    libc::posix_fallocate(fd, 0, size)
}

#[cfg(target_os = "macos")]
unsafe fn preallocate_fd(fd: i32, size: i64) -> i32 {
    // ftruncate only extends the file; blocks are allocated lazily.
    if libc::ftruncate(fd, size) == -1 {
        -1
    } else {
        0
    }
}

// ── Constants ──────────────────────────────────────────────────────────────

pub const SHM_MAGIC: u32 = 0xFECA_0DF0;
pub const BLK_MAGIC: u32 = 0x0CB1_0DF0;
pub const MAX_VOLUME_NUMBER: usize = 32;
pub const MAX_FILENAME_SIZE: usize = 128;
pub const MAX_PATH_SIZE: usize = 512;

const LOCK_UNLOCKED: u32 = 0;
const LOCK_LOCKED: u32 = 1;
const SPIN_LIMIT: u32 = 40;
#[cfg(target_os = "linux")]
const LOCK_TIMEOUT_SECS: u64 = 5;

// ── Pointer types ──────────────────────────────────────────────────────────

/// Relative pointer: index into the multi-volume pool (cross-process safe).
pub type RelPtr = isize;
/// Volume-local pointer: offset within a single volume.
pub type VolPtr = isize;
/// Absolute pointer: virtual address in this process.
pub type AbsPtr = *mut u8;

pub const RELNULL: RelPtr = -1;
pub const VOLNULL: VolPtr = -1;

// ── Block alignment ────────────────────────────────────────────────────────

// NOTE(review): the alignment target type was lost in a bad merge; usize
// matches BlockHeader's alignment (8 on 64-bit) and the align_up(.., 8)
// tests below — confirm against the original shm.c.
pub const BLOCK_ALIGN: usize = std::mem::align_of::<usize>();

#[inline]
pub const fn align_up(x: usize, align: usize) -> usize {
    (x + align - 1) & !(align - 1)
}

// ── Shared memory header (lives in mmap'd region) ──────────────────────────

#[repr(C)]
pub struct ShmHeader {
    pub magic: u32,
    pub volume_name: [u8; MAX_FILENAME_SIZE],
    pub volume_index: i32,
    pub volume_size: usize,
    pub relative_offset: usize,
    pub lock: AtomicU32,
    pub cursor: VolPtr,
}

#[repr(C)]
pub struct BlockHeader {
    pub magic: u32,
    pub reference_count: AtomicU32,
    pub size: usize,
}

// Compile-time check: BlockHeader must have no padding so that C and Rust
// agree on the layout (restored type parameters; mirrors
// tests::test_block_header_no_padding).
const _: () = assert!(
    std::mem::size_of::<BlockHeader>()
        == std::mem::size_of::<u32>()
            + std::mem::size_of::<AtomicU32>()
            + std::mem::size_of::<usize>()
);

// ── Voidstar data structures (used by serialization) ───────────────────────

/// Variable-length array/string representation in SHM.
#[derive(Clone, Copy)]
#[repr(C)]
pub struct Array {
    pub size: usize,
    pub data: RelPtr,
}

/// N-dimensional dense tensor in SHM.
#[repr(C)]
pub struct Tensor {
    pub total_elements: usize,
    pub device_type: u32,
    pub device_id: u32,
    pub data: RelPtr,
    pub shape: RelPtr,
}

// ── Send wrapper for raw pointers ──────────────────────────────────────────

#[derive(Clone, Copy)]
struct SendPtr(*mut ShmHeader);

// SAFETY: ShmHeader lives in mmap'd shared memory that outlives all threads.
// Access is serialized via VOLUMES Mutex and per-volume AtomicU32 futex locks.
unsafe impl Send for SendPtr {}

impl SendPtr {
    const fn null() -> Self {
        SendPtr(std::ptr::null_mut())
    }
    fn is_null(&self) -> bool {
        self.0.is_null()
    }
    fn ptr(&self) -> *mut ShmHeader {
        self.0
    }
    fn set(&mut self, p: *mut ShmHeader) {
        self.0 = p;
    }
}

/// Read a NUL-terminated string from a fixed-size filename buffer.
fn get_cstr_buf(buf: &[u8; MAX_FILENAME_SIZE]) -> &str {
    get_cstr(buf.as_slice())
}

// ── Global state ───────────────────────────────────────────────────────────

static CURRENT_VOLUME: std::sync::atomic::AtomicUsize = std::sync::atomic::AtomicUsize::new(0);
static VOLUMES: Mutex<[SendPtr; MAX_VOLUME_NUMBER]> =
    Mutex::new([SendPtr::null(); MAX_VOLUME_NUMBER]);
static ALLOC_MUTEX: Mutex<()> = Mutex::new(());
static COMMON_BASENAME: Mutex<[u8; MAX_FILENAME_SIZE]> = Mutex::new([0u8; MAX_FILENAME_SIZE]);
static FALLBACK_DIR: Mutex<[u8; MAX_FILENAME_SIZE]> = Mutex::new([0u8; MAX_FILENAME_SIZE]);

/// Copy `s` into `buf` as a NUL-terminated C string, truncating if needed.
fn set_cstr(buf: &mut [u8], s: &str) {
    let bytes = s.as_bytes();
    let len = bytes.len().min(buf.len() - 1);
    buf[..len].copy_from_slice(&bytes[..len]);
    buf[len] = 0;
}

/// Read a NUL-terminated string from `buf`; invalid UTF-8 yields "".
fn get_cstr(buf: &[u8]) -> &str {
    let end = buf.iter().position(|&b| b == 0).unwrap_or(buf.len());
    std::str::from_utf8(&buf[..end]).unwrap_or("")
}

// ── Public API ─────────────────────────────────────────────────────────────

/// Set fallback directory for file-backed SHM when /dev/shm is too small.
pub fn shm_set_fallback_dir(dir: &str) { let mut fb = FALLBACK_DIR.lock().unwrap(); set_cstr(&mut *fb, dir); } /// Initialize a new SHM volume. pub fn shinit( shm_basename: &str, volume_index: usize, shm_size: usize, ) -> Result<*mut ShmHeader, MorlocError> { let full_size = shm_size + std::mem::size_of::(); let shm_name = format!("{}_{}", shm_basename, volume_index); // Store common basename { let mut cb = COMMON_BASENAME.lock().unwrap(); set_cstr(&mut *cb, shm_basename); } // Try POSIX shared memory first, fall back to file-backed let (fd, created, volume_label, actual_full_size) = try_open_shm(&shm_name, full_size)?; // SAFETY: mmap with MAP_SHARED on a valid fd obtained from shm_open/open above. // The returned pointer is checked against MAP_FAILED before use. let ptr = unsafe { libc::mmap( std::ptr::null_mut(), actual_full_size, libc::PROT_READ | libc::PROT_WRITE, libc::MAP_SHARED, fd, 0, ) }; // SAFETY: fd is a valid file descriptor opened above. unsafe { libc::close(fd) }; if ptr == libc::MAP_FAILED { return Err(MorlocError::Shm(format!( "Failed to mmap volume '{}' ({} bytes)", volume_label, actual_full_size ))); } let shm = ptr as *mut ShmHeader; // Store in volumes array { let mut vols = VOLUMES.lock().unwrap(); vols[volume_index].set(shm); } let actual_data_size = actual_full_size - std::mem::size_of::(); if created { // SAFETY: shm points to the start of our mmap'd region of actual_full_size bytes. // We just created it, so we have exclusive access for initialization. 
unsafe { (*shm).magic = SHM_MAGIC; let mut name_buf = [0u8; MAX_FILENAME_SIZE]; set_cstr(&mut name_buf, &volume_label); (*shm).volume_name = name_buf; (*shm).volume_index = volume_index as i32; // Calculate relative offset from prior volumes let vols = VOLUMES.lock().unwrap(); let mut rel_offset = 0usize; for i in 0..volume_index { if !vols[i].is_null() { rel_offset += (*vols[i].ptr()).volume_size; } } (*shm).relative_offset = rel_offset; (*shm).volume_size = actual_data_size; (*shm).lock = AtomicU32::new(LOCK_UNLOCKED); (*shm).cursor = 0; // Initialize first block header let first_block = (shm as *mut u8).add(std::mem::size_of::()) as *mut BlockHeader; (*first_block).magic = BLK_MAGIC; (*first_block).reference_count = AtomicU32::new(0); (*first_block).size = actual_data_size - std::mem::size_of::(); } } Ok(shm) } /// Open an existing SHM volume (or return cached pointer). pub fn shopen(volume_index: usize) -> Result, MorlocError> { { let vols = VOLUMES.lock().unwrap(); if !vols[volume_index].is_null() { return Ok(Some(vols[volume_index].ptr())); } } let basename = { let cb = COMMON_BASENAME.lock().unwrap(); get_cstr_buf(&cb).to_string() }; if basename.is_empty() { return Ok(None); } let shm_name = format!("{}_{}", basename, volume_index); // Try POSIX SHM let name_cstr = std::ffi::CString::new(shm_name.as_str()).unwrap(); // SAFETY: name_cstr is a valid null-terminated CString. let fd = unsafe { libc::shm_open(name_cstr.as_ptr(), libc::O_RDWR, 0o666) }; let fd = if fd == -1 { // Try file-backed fallback let fb = FALLBACK_DIR.lock().unwrap(); let fallback = get_cstr_buf(&fb); if fallback.is_empty() { return Ok(None); } let file_path = format!("{}/{}", fallback, shm_name); let path_cstr = std::ffi::CString::new(file_path.as_str()).unwrap(); let fd2 = unsafe { libc::open(path_cstr.as_ptr(), libc::O_RDWR) }; if fd2 == -1 { return Ok(None); } fd2 } else { fd }; // SAFETY: zeroed memory is valid for libc::stat. fstat/close on valid fd. 
let mut sb: libc::stat = unsafe { std::mem::zeroed() }; if unsafe { libc::fstat(fd, &mut sb) } == -1 { unsafe { libc::close(fd) }; return Err(MorlocError::Shm(format!( "Cannot fstat SHM volume '{}'", shm_name ))); } let volume_size = sb.st_size as usize; // SAFETY: mmap with MAP_SHARED on a valid fd; result checked against MAP_FAILED. let ptr = unsafe { libc::mmap( std::ptr::null_mut(), volume_size, libc::PROT_READ | libc::PROT_WRITE, libc::MAP_SHARED, fd, 0, ) }; // SAFETY: fd is a valid file descriptor opened above. unsafe { libc::close(fd) }; if ptr == libc::MAP_FAILED { return Err(MorlocError::Shm(format!( "Cannot mmap SHM volume '{}'", shm_name ))); } let shm = ptr as *mut ShmHeader; { let mut vols = VOLUMES.lock().unwrap(); vols[volume_index].set(shm); } Ok(Some(shm)) } /// Close and unlink all SHM volumes. pub fn shclose() -> Result<(), MorlocError> { let _lock = ALLOC_MUTEX.lock().unwrap(); let mut vols = VOLUMES.lock().unwrap(); for i in 0..MAX_VOLUME_NUMBER { let shm = if !vols[i].is_null() { vols[i].ptr() } else { continue; }; // SAFETY: shm is a valid mmap'd pointer stored in VOLUMES. // munmap/unlink on regions we own. Name read from valid ShmHeader. unsafe { let name = get_cstr(&(*shm).volume_name).to_string(); let full_size = (*shm).volume_size + std::mem::size_of::(); libc::munmap(shm as *mut libc::c_void, full_size); // Unlink: file-backed volumes start with '/', POSIX SHM does not if name.starts_with('/') { let cstr = std::ffi::CString::new(name.as_str()).unwrap(); libc::unlink(cstr.as_ptr()); } else { let cstr = std::ffi::CString::new(name.as_str()).unwrap(); libc::shm_unlink(cstr.as_ptr()); } } vols[i] = SendPtr::null(); } Ok(()) } /// Allocate `size` bytes from shared memory. pub fn shmalloc(size: usize) -> Result { // Allow 0-size: round up to minimum block alignment. // Needed for nil type (width=0) in morloc_eval. 
let size = if size == 0 { BLOCK_ALIGN } else { align_up(size, BLOCK_ALIGN) }; let _lock = ALLOC_MUTEX.lock().unwrap(); shmalloc_unlocked(size) } /// Copy data into a new SHM allocation. pub fn shmemcpy(src: *const u8, size: usize) -> Result { let dest = shmalloc(size)?; // SAFETY: dest is a freshly allocated SHM block of `size` bytes. // Caller guarantees src points to `size` readable bytes. unsafe { std::ptr::copy_nonoverlapping(src, dest, size) }; Ok(dest) } /// Allocate and zero-fill. pub fn shcalloc(nmemb: usize, size: usize) -> Result { let total = nmemb * size; let ptr = shmalloc(total)?; // SAFETY: ptr is a freshly allocated SHM block of `total` bytes. unsafe { std::ptr::write_bytes(ptr, 0, total) }; Ok(ptr) } /// Free a shared memory block (decrement reference count). pub fn shfree(ptr: AbsPtr) -> Result<(), MorlocError> { let _lock = ALLOC_MUTEX.lock().unwrap(); shfree_unlocked(ptr) } /// Increment reference count on a shared memory block. pub fn shincref(ptr: AbsPtr) -> Result<(), MorlocError> { if ptr.is_null() { return Err(MorlocError::Shm("Cannot incref NULL pointer".into())); } // SAFETY: ptr was returned by shmalloc, which places a BlockHeader immediately before // the returned data pointer. Magic check below validates the header. let blk = unsafe { &*(ptr.sub(std::mem::size_of::()) as *const BlockHeader) }; if blk.magic != BLK_MAGIC { return Err(MorlocError::Shm("Corrupted memory - invalid magic".into())); } blk.reference_count.fetch_add(1, Ordering::AcqRel); Ok(()) } /// Convert relative pointer to absolute pointer. pub fn rel2abs(ptr: RelPtr) -> Result { if ptr < 0 { return Err(MorlocError::Shm(format!("Illegal relptr value {}", ptr))); } let mut remaining = ptr as usize; // First try with volumes already mapped { let vols = VOLUMES.lock().unwrap(); for i in 0..MAX_VOLUME_NUMBER { if vols[i].is_null() { break; // No more volumes mapped } let shm = vols[i].ptr(); // SAFETY: shm is a valid mmap'd ShmHeader pointer from VOLUMES. 
let vol_size = unsafe { (*shm).volume_size }; if remaining < vol_size { // SAFETY: data region starts after ShmHeader; remaining < vol_size // guarantees the offset is within the mmap'd region. let base = unsafe { (shm as *const u8).add(std::mem::size_of::()) }; return Ok(unsafe { base.add(remaining) as AbsPtr }); } remaining -= vol_size; } } // If not found, try opening unmapped volumes remaining = ptr as usize; for i in 0..MAX_VOLUME_NUMBER { let shm = match shopen(i)? { Some(s) => s, None => { return Err(MorlocError::Shm(format!( "Failed to find volume for relptr {}", ptr ))); } }; // SAFETY: shm is a valid mmap'd ShmHeader pointer from shopen. let vol_size = unsafe { (*shm).volume_size }; if remaining < vol_size { // SAFETY: same as above - offset within mmap'd region. let base = unsafe { (shm as *const u8).add(std::mem::size_of::()) }; return Ok(unsafe { base.add(remaining) as AbsPtr }); } remaining -= vol_size; } Err(MorlocError::Shm(format!( "Shared memory pool does not contain index {}", ptr ))) } /// Convert absolute pointer to relative pointer. pub fn abs2rel(ptr: AbsPtr) -> Result { let vols = VOLUMES.lock().unwrap(); for i in 0..MAX_VOLUME_NUMBER { let shm = vols[i].ptr(); if shm.is_null() { continue; } // SAFETY: shm is a valid mmap'd ShmHeader from VOLUMES. We compute // data region bounds and check ptr falls within before computing offset. unsafe { let data_start = (shm as *const u8).add(std::mem::size_of::()); let data_end = data_start.add((*shm).volume_size); let p = ptr as *const u8; if p >= data_start && p < data_end { let offset = p.offset_from(data_start) as usize; return Ok(((*shm).relative_offset + offset) as RelPtr); } } } Err(MorlocError::Shm(format!( "Failed to find absptr {:?} in shared memory", ptr ))) } /// Find the ShmHeader for a given absolute pointer. 
pub fn abs2shm(ptr: AbsPtr) -> Result<*mut ShmHeader, MorlocError> { let vols = VOLUMES.lock().unwrap(); for i in 0..MAX_VOLUME_NUMBER { let shm = vols[i].ptr(); if shm.is_null() { continue; } // SAFETY: shm is a valid mmap'd ShmHeader from VOLUMES. unsafe { let data_start = (shm as *const u8).add(std::mem::size_of::()); let data_end = data_start.add((*shm).volume_size); let p = ptr as *const u8; if p >= data_start && p < data_end { return Ok(shm); } } } Err(MorlocError::Shm("Failed to find absptr in SHM".into())) } /// Total size of all SHM volumes. pub fn total_shm_size() -> usize { let vols = VOLUMES.lock().unwrap(); let mut total = 0; for i in 0..MAX_VOLUME_NUMBER { if !vols[i].is_null() { // SAFETY: non-null VOLUMES entries are valid mmap'd ShmHeader pointers. total += unsafe { (*vols[i].ptr()).volume_size }; } } total } // ── Internal helpers ─────────────────────────────────────────────────────── fn try_open_shm( shm_name: &str, full_size: usize, ) -> Result<(i32, bool, String, usize), MorlocError> { let name_cstr = std::ffi::CString::new(shm_name).unwrap(); // Try POSIX SHM let fd = unsafe { libc::shm_open( name_cstr.as_ptr(), libc::O_RDWR | libc::O_CREAT, 0o666, ) }; if fd >= 0 { let mut sb: libc::stat = unsafe { std::mem::zeroed() }; if unsafe { libc::fstat(fd, &mut sb) } == -1 { unsafe { libc::close(fd) }; return Err(MorlocError::Shm(format!("fstat failed for '{}'", shm_name))); } let created = sb.st_size == 0; if created { let err = unsafe { preallocate_fd(fd, full_size as i64) }; if err == 0 { return Ok((fd, true, shm_name.to_string(), full_size)); } // /dev/shm too small, clean up and try file-backed unsafe { libc::close(fd); libc::shm_unlink(name_cstr.as_ptr()); } } else { return Ok((fd, false, shm_name.to_string(), sb.st_size as usize)); } } // Try file-backed fallback let fb = FALLBACK_DIR.lock().unwrap(); let fallback = get_cstr_buf(&fb); if fallback.is_empty() { return Err(MorlocError::Shm(format!( "Failed to allocate SHM '{}': /dev/shm too small 
and no fallback directory", shm_name ))); } let file_path = format!("{}/{}", fallback, shm_name); drop(fb); let path_cstr = std::ffi::CString::new(file_path.as_str()).unwrap(); let fd = unsafe { libc::open(path_cstr.as_ptr(), libc::O_RDWR | libc::O_CREAT, 0o666) }; if fd == -1 { return Err(MorlocError::Shm(format!( "Failed to create file-backed volume '{}'", file_path ))); } let mut sb: libc::stat = unsafe { std::mem::zeroed() }; if unsafe { libc::fstat(fd, &mut sb) } == -1 { unsafe { libc::close(fd) }; return Err(MorlocError::Shm(format!("fstat failed for '{}'", file_path))); } let created = sb.st_size == 0; let actual_size = if created { let err = unsafe { preallocate_fd(fd, full_size as i64) }; if err != 0 { unsafe { libc::close(fd); libc::unlink(path_cstr.as_ptr()); } return Err(MorlocError::Shm(format!( "Failed to allocate file-backed volume '{}' ({} bytes)", file_path, full_size ))); } full_size } else { sb.st_size as usize }; Ok((fd, created, file_path, actual_size)) } fn shmalloc_unlocked(size: usize) -> Result { let mut shm: *mut ShmHeader = std::ptr::null_mut(); let blk = find_free_block(size, &mut shm)?; // Split and claim let final_blk = split_block(shm, blk, size)?; // SAFETY: final_blk is a valid BlockHeader in mmap'd SHM found by find_free_block. // The data region starts immediately after the header. unsafe { (*final_blk).reference_count.store(1, Ordering::Release); Ok((final_blk as *mut u8).add(std::mem::size_of::())) } } fn shfree_unlocked(ptr: AbsPtr) -> Result<(), MorlocError> { if ptr.is_null() { return Err(MorlocError::Shm("Cannot free NULL pointer".into())); } // SAFETY: ptr was returned by shmalloc, which places a BlockHeader // immediately before the data. Magic check validates correctness. 
let blk = unsafe { &*(ptr.sub(std::mem::size_of::()) as *const BlockHeader) }; if blk.magic != BLK_MAGIC { return Err(MorlocError::Shm("Corrupted memory".into())); } if blk.reference_count.load(Ordering::Acquire) == 0 { return Err(MorlocError::Shm("Reference count already 0".into())); } let prev = blk.reference_count.fetch_sub(1, Ordering::AcqRel); if prev == 1 { // SAFETY: ptr points to blk.size bytes of SHM data we own (refcount just hit 0). unsafe { std::ptr::write_bytes(ptr, 0, blk.size); } } Ok(()) } fn find_free_block( size: usize, shm_out: &mut *mut ShmHeader, ) -> Result<*mut BlockHeader, MorlocError> { let cv = CURRENT_VOLUME.load(Ordering::Relaxed); let vols = VOLUMES.lock().unwrap(); // Try current volume first let shm = vols[cv].ptr(); if !shm.is_null() { if let Some(blk) = find_free_block_in_volume(shm, size)? { *shm_out = shm; return Ok(blk); } } // Search all volumes for i in 0..MAX_VOLUME_NUMBER { let shm = vols[i].ptr(); if shm.is_null() { // Create a new volume drop(vols); let new_size = std::cmp::max(size * 2, 0xffff); let basename = { let cb = COMMON_BASENAME.lock().unwrap(); get_cstr_buf(&cb).to_string() }; let new_shm = shinit(&basename, i, new_size)?; CURRENT_VOLUME.store(i, Ordering::Relaxed); *shm_out = new_shm; let blk = unsafe { (new_shm as *mut u8).add(std::mem::size_of::()) as *mut BlockHeader }; return Ok(blk); } if let Some(blk) = find_free_block_in_volume(shm, size)? 
{ CURRENT_VOLUME.store(i, Ordering::Relaxed); *shm_out = shm; return Ok(blk); } } Err(MorlocError::Shm(format!( "Could not find suitable block for {} bytes", size ))) } fn find_free_block_in_volume( shm: *mut ShmHeader, size: usize, ) -> Result, MorlocError> { unsafe { let shm_end = (shm as *const u8) .add(std::mem::size_of::()) .add((*shm).volume_size); shm_lock(&(*shm).lock)?; // Try cursor position first let cursor = (*shm).cursor; if cursor != VOLNULL { let blk = vol2abs_raw(cursor, shm); let blk = blk as *mut BlockHeader; if (*blk).magic == BLK_MAGIC && (*blk).reference_count.load(Ordering::Relaxed) == 0 && (*blk).size >= size { shm_unlock(&(*shm).lock); return Ok(Some(blk)); } } // Scan from cursor forward let start_blk = if cursor != VOLNULL { vol2abs_raw(cursor, shm) as *mut BlockHeader } else { vol2abs_raw(0, shm) as *mut BlockHeader }; if let Some(blk) = scan_volume(start_blk, size, shm_end as *const u8) { shm_unlock(&(*shm).lock); return Ok(Some(blk)); } // Wrap around: scan from beginning to cursor if cursor > 0 { let first_blk = vol2abs_raw(0, shm) as *mut BlockHeader; let cursor_end = vol2abs_raw(cursor, shm); if let Some(blk) = scan_volume(first_blk, size, cursor_end as *const u8) { shm_unlock(&(*shm).lock); return Ok(Some(blk)); } } shm_unlock(&(*shm).lock); Ok(None) } } /// Scan a volume region for a free block of at least `size` bytes, merging adjacent free blocks. /// /// # Safety /// `blk` must point to a valid BlockHeader within an mmap'd SHM volume. /// `end` must point to the byte past the end of the volume's data region. 
unsafe fn scan_volume( mut blk: *mut BlockHeader, size: usize, end: *const u8, ) -> Option<*mut BlockHeader> { let hdr_size = std::mem::size_of::(); while (blk as *const u8).add(hdr_size + size) <= end { if blk.is_null() || (*blk).magic != BLK_MAGIC { return None; } // Merge adjacent free blocks while (*blk).reference_count.load(Ordering::Relaxed) == 0 { let next = (blk as *mut u8).add(hdr_size + (*blk).size) as *mut BlockHeader; if (next as *const u8) >= end || (*next).magic != BLK_MAGIC || (*next).reference_count.load(Ordering::Relaxed) != 0 { break; } (*blk).size += hdr_size + (*next).size; } if (*blk).reference_count.load(Ordering::Relaxed) == 0 && (*blk).size >= size { return Some(blk); } blk = (blk as *mut u8).add(hdr_size + (*blk).size) as *mut BlockHeader; } None } fn split_block( shm: *mut ShmHeader, blk: *mut BlockHeader, size: usize, ) -> Result<*mut BlockHeader, MorlocError> { unsafe { if (*blk).size == size { return Ok(blk); } shm_lock(&(*shm).lock)?; let remaining = (*blk).size - size; (*blk).size = size; let hdr_size = std::mem::size_of::(); let new_free = (blk as *mut u8).add(hdr_size + size) as *mut BlockHeader; if remaining > hdr_size { (*new_free).magic = BLK_MAGIC; (*new_free).reference_count = AtomicU32::new(0); (*new_free).size = remaining - hdr_size; // Update cursor let data_start = (shm as *const u8).add(std::mem::size_of::()); (*shm).cursor = (new_free as *const u8).offset_from(data_start) as VolPtr; } else { (*blk).size += remaining; (*shm).cursor = VOLNULL; } shm_unlock(&(*shm).lock); Ok(blk) } } /// Convert a volume-local offset to an absolute pointer. /// /// # Safety /// `shm` must be a valid mmap'd ShmHeader. `ptr` must be within the volume's data region. 
#[inline] unsafe fn vol2abs_raw(ptr: VolPtr, shm: *const ShmHeader) -> *mut u8 { (shm as *const u8) .add(std::mem::size_of::()) .add(ptr as usize) as *mut u8 } // ── Futex-based lock ─────────────────────────────────────────────────────── /// Acquire a futex-based cross-process lock on shared memory. /// /// # Safety /// `lock` must point to an AtomicU32 in mmap'd shared memory that /// persists for the duration of the lock. The caller must call shm_unlock /// on the same lock when done. pub unsafe fn shm_lock(lock: &AtomicU32) -> Result<(), MorlocError> { if lock .compare_exchange_weak(LOCK_UNLOCKED, LOCK_LOCKED, Ordering::Acquire, Ordering::Relaxed) .is_ok() { return Ok(()); } for _ in 0..SPIN_LIMIT { std::hint::spin_loop(); if lock .compare_exchange_weak(LOCK_UNLOCKED, LOCK_LOCKED, Ordering::Acquire, Ordering::Relaxed) .is_ok() { return Ok(()); } } shm_lock_slow(lock) } #[cfg(target_os = "linux")] unsafe fn shm_lock_slow(lock: &AtomicU32) -> Result<(), MorlocError> { let timeout = libc::timespec { tv_sec: LOCK_TIMEOUT_SECS as i64, tv_nsec: 0, }; loop { let ptr = lock as *const AtomicU32 as *const u32; libc::syscall( libc::SYS_futex, ptr, libc::FUTEX_WAIT, LOCK_LOCKED, &timeout as *const libc::timespec, std::ptr::null::(), 0u32, ); if lock .compare_exchange_weak(LOCK_UNLOCKED, LOCK_LOCKED, Ordering::Acquire, Ordering::Relaxed) .is_ok() { return Ok(()); } if lock.load(Ordering::Relaxed) == LOCK_LOCKED { if lock .compare_exchange(LOCK_LOCKED, LOCK_UNLOCKED, Ordering::AcqRel, Ordering::Relaxed) .is_ok() { if lock .compare_exchange(LOCK_UNLOCKED, LOCK_LOCKED, Ordering::Acquire, Ordering::Relaxed) .is_ok() { return Ok(()); } } } } } /// macOS fallback: spin-yield loop (no futex available). 
#[cfg(target_os = "macos")] unsafe fn shm_lock_slow(lock: &AtomicU32) -> Result<(), MorlocError> { loop { std::thread::yield_now(); if lock .compare_exchange_weak(LOCK_UNLOCKED, LOCK_LOCKED, Ordering::Acquire, Ordering::Relaxed) .is_ok() { return Ok(()); } } } /// Release a futex-based cross-process lock on shared memory. /// /// # Safety /// `lock` must be the same AtomicU32 previously acquired via shm_lock. pub unsafe fn shm_unlock(lock: &AtomicU32) { lock.store(LOCK_UNLOCKED, Ordering::Release); #[cfg(target_os = "linux")] { let ptr = lock as *const AtomicU32 as *const u32; libc::syscall( libc::SYS_futex, ptr, libc::FUTEX_WAKE, 1, std::ptr::null::(), std::ptr::null::(), 0u32, ); } // macOS: no futex wake needed; spin-yield waiters will see the store. } // ── Pointer conversion helpers ───────────────────────────────────────────── #[inline] pub fn vol2rel(ptr: VolPtr, shm: &ShmHeader) -> RelPtr { shm.relative_offset as RelPtr + ptr } /// # Safety /// `shm` must be a valid mmap'd ShmHeader. `ptr` must be within the volume's data region. 
#[inline] pub unsafe fn vol2abs(ptr: VolPtr, shm: *const ShmHeader) -> AbsPtr { vol2abs_raw(ptr, shm) } // ── Tests ────────────────────────────────────────────────────────────────── #[cfg(test)] mod tests { use super::*; #[test] fn test_block_header_no_padding() { assert_eq!( std::mem::size_of::(), 4 + 4 + std::mem::size_of::() ); } #[test] fn test_align_up() { assert_eq!(align_up(0, 8), 0); assert_eq!(align_up(1, 8), 8); assert_eq!(align_up(7, 8), 8); assert_eq!(align_up(8, 8), 8); assert_eq!(align_up(9, 8), 16); } #[test] fn test_pointer_constants() { assert_eq!(RELNULL, -1); assert_eq!(VOLNULL, -1); } #[test] fn test_lock_unlock() { let lock = AtomicU32::new(LOCK_UNLOCKED); unsafe { shm_lock(&lock).unwrap(); assert_eq!(lock.load(Ordering::Relaxed), LOCK_LOCKED); shm_unlock(&lock); assert_eq!(lock.load(Ordering::Relaxed), LOCK_UNLOCKED); } } #[test] fn test_array_struct_size() { assert_eq!( std::mem::size_of::(), std::mem::size_of::() + std::mem::size_of::() ); } #[test] fn test_shinit_and_shmalloc() { // Use file-backed SHM via tmpdir to avoid /dev/shm permission issues in test let tmpdir = std::env::temp_dir(); let test_dir = tmpdir.join(format!("morloc_test_{}", std::process::id())); std::fs::create_dir_all(&test_dir).unwrap(); shm_set_fallback_dir(test_dir.to_str().unwrap()); let basename = format!("test_shm_{}", std::process::id()); let shm = shinit(&basename, 0, 4096).unwrap(); assert!(!shm.is_null()); assert_eq!(unsafe { (*shm).magic }, SHM_MAGIC); // Allocate some memory let ptr1 = shmalloc(64).unwrap(); assert!(!ptr1.is_null()); // Write and read back unsafe { std::ptr::write_bytes(ptr1, 0xAB, 64); assert_eq!(*ptr1, 0xAB); } // Convert to relptr and back let rel = abs2rel(ptr1).unwrap(); assert!(rel >= 0); let abs = rel2abs(rel).unwrap(); assert_eq!(abs, ptr1); // Free shfree(ptr1).unwrap(); // Cleanup shclose().unwrap(); let _ = std::fs::remove_dir_all(&test_dir); } } ================================================ FILE: 
data/rust/morloc-runtime/src/slurm_ffi.rs ================================================
//! C ABI wrappers for SLURM job submission.
//! Replaces slurm.c.

use std::ffi::{c_char, c_void, CStr, CString};
use std::ptr;

use crate::error::{clear_errmsg, set_errmsg, MorlocError};

const MAX_SLURM_COMMAND_LENGTH: usize = 1024;
const DEFAULT_XXHASH_SEED: u64 = 0;

// ── C-compatible types ───────────────────────────────────────────────────────

// Resource request passed in from C callers; #[repr(C)] keeps the field layout
// identical to the C struct it replaces.
#[repr(C)]
pub struct Resources {
    pub memory: i32, // in Gb
    pub time: i32, // walltime in seconds
    pub cpus: i32,
    pub gpus: i32,
}

// ── parse_slurm_time ─────────────────────────────────────────────────────────

// Parse a SLURM walltime string ("D-HH:MM:SS" or "HH:MM:SS") into total seconds.
// Returns 0 with `errmsg` set on any parse or range failure.
// NOTE(review): 0 is also a legal result for "0:00:00", so callers must test
// errmsg, not the return value, to distinguish errors.
#[no_mangle]
pub unsafe extern "C" fn parse_slurm_time(
    time_str: *const c_char,
    errmsg: *mut *mut c_char,
) -> usize {
    clear_errmsg(errmsg);
    let s = CStr::from_ptr(time_str).to_string_lossy();
    let mut days: i32 = 0;
    let hours: i32;
    let minutes: i32;
    let seconds: i32;
    // Try D-HH:MM:SS format
    if let Some(dash_pos) = s.find('-') {
        days = match s[..dash_pos].parse() {
            Ok(d) => d,
            Err(_) => {
                set_errmsg(errmsg, &MorlocError::Other(format!("Failed to scan slurm walltime string '{}'", s)));
                return 0;
            }
        };
        let rest = &s[dash_pos + 1..];
        let parts: Vec<&str> = rest.split(':').collect();
        if parts.len() != 3 {
            set_errmsg(errmsg, &MorlocError::Other(format!("Failed to scan slurm walltime string '{}'", s)));
            return 0;
        }
        // unwrap_or(-1) funnels non-numeric fields into the range checks below
        hours = parts[0].parse().unwrap_or(-1);
        minutes = parts[1].parse().unwrap_or(-1);
        seconds = parts[2].parse().unwrap_or(-1);
    } else {
        // Try HH:MM:SS format
        let parts: Vec<&str> = s.split(':').collect();
        if parts.len() != 3 {
            set_errmsg(errmsg, &MorlocError::Other(format!("Failed to scan slurm walltime string '{}'", s)));
            return 0;
        }
        hours = parts[0].parse().unwrap_or(-1);
        minutes = parts[1].parse().unwrap_or(-1);
        seconds = parts[2].parse().unwrap_or(-1);
    }
    if days < 0 || hours < 0 || minutes < 0 || seconds < 0 {
        set_errmsg(errmsg, &MorlocError::Other(format!("Negative time component in '{}'", s)));
        return 0;
    }
    if hours > 23 || minutes > 59 || seconds > 59 {
        set_errmsg(errmsg, &MorlocError::Other(format!("Invalid time component in '{}' (HH<=23 MM<=59 SS<=59)", s)));
        return 0;
    }
    if days > 3650 {
        set_errmsg(errmsg, &MorlocError::Other("Do you really want to run this job for more than 10 years?".into()));
        return 0;
    }
    (seconds + 60 * minutes + 60 * 60 * hours + 60 * 60 * 24 * days) as usize
}

// Format a second count as SLURM "D-HH:MM:SS". The returned pointer comes from
// CString::into_raw; NULL if formatting produced an interior NUL (cannot happen
// for this format, kept for safety).
// NOTE(review): callers in this file release the result with libc::free, but a
// CString::into_raw pointer must be released with CString::from_raw — the two
// allocators are not guaranteed to match. Verify before relying on this.
#[no_mangle]
pub unsafe extern "C" fn write_slurm_time(seconds: i32) -> *mut c_char {
    let mut rem = seconds;
    let days = rem / (60 * 60 * 24);
    rem -= days * 60 * 60 * 24;
    let hours = rem / (60 * 60);
    rem -= hours * 60 * 60;
    let minutes = rem / 60;
    rem -= minutes * 60;
    let s = format!("{}-{:02}:{:02}:{:02}", days, hours, minutes, rem);
    match CString::new(s) {
        Ok(cs) => cs.into_raw(),
        Err(_) => ptr::null_mut(),
    }
}

// ── parse_morloc_call_arguments ──────────────────────────────────────────────

// Split a morloc CALL packet into pointers to its embedded argument packets.
// `args` must have room for all arguments; `nargs` receives the count.
// Layout assumed: 32-byte header, then `offset` bytes of metadata, then
// `length` bytes of payload, for the outer packet and each nested argument.
#[no_mangle]
pub unsafe extern "C" fn parse_morloc_call_arguments(
    packet: *mut u8,
    args: *mut *mut u8,
    nargs: *mut usize,
    errmsg: *mut *mut c_char,
) -> bool {
    clear_errmsg(errmsg);
    *nargs = 0;
    let header = &*(packet as *const crate::packet::PacketHeader);
    let packet_size = 32 + header.offset as usize + header.length as usize;
    if header.command_type() != crate::packet::PACKET_TYPE_CALL {
        set_errmsg(errmsg, &MorlocError::Packet("Unexpected packet type (BUG)".into()));
        return false;
    }
    // First pass: count args
    let mut pos = 32 + header.offset as usize;
    while pos < packet_size {
        let arg_header = &*(packet.add(pos) as *const crate::packet::PacketHeader);
        pos += 32 + arg_header.offset as usize + arg_header.length as usize;
        *nargs += 1;
    }
    // Second pass: set pointers
    pos = 32 + header.offset as usize;
    for i in 0..*nargs {
        *args.add(i) = packet.add(pos);
        let arg_header = &*(packet.add(pos) as *const crate::packet::PacketHeader);
        pos += 32 + arg_header.offset as usize + arg_header.length as usize;
    }
    true
}

// ── slurm_job_is_complete ────────────────────────────────────────────────────

#[no_mangle]
pub unsafe extern 
"C" fn slurm_job_is_complete(job_id: u32) -> bool { let cmd = format!("sacct -j {} --format=State --noheader\0", job_id); let sacct = libc::popen(cmd.as_ptr() as *const c_char, b"r\0".as_ptr() as *const c_char); if sacct.is_null() { return false; } let mut state = [0u8; 64]; let mut done = false; while !libc::fgets(state.as_mut_ptr() as *mut c_char, 64, sacct).is_null() { let s = std::str::from_utf8(&state).unwrap_or(""); if s.contains("COMPLETED") || s.contains("FAILED") || s.contains("CANCELLED") { done = true; break; } } libc::pclose(sacct); done } // ── shell_escape ───────────────────────────────────────────────────────────── fn shell_escape(input: &str) -> String { let mut out = String::with_capacity(input.len() + 10); out.push('\''); for ch in input.chars() { if ch == '\'' { out.push_str("'\\''"); } else { out.push(ch); } } out.push('\''); out } // ── submit_morloc_slurm_job ────────────────────────────────────────────────── #[no_mangle] pub unsafe extern "C" fn submit_morloc_slurm_job( nexus_path: *const c_char, socket_basename: *const c_char, call_packet_filename: *const c_char, result_cache_filename: *const c_char, output_filename: *const c_char, error_filename: *const c_char, resources: *const Resources, errmsg: *mut *mut c_char, ) -> u32 { clear_errmsg(errmsg); macro_rules! 
    // Local macro: reject a NULL pointer argument with a named error, return 0.
    check_null {
        ($ptr:expr, $name:expr) => {
            if $ptr.is_null() {
                set_errmsg(errmsg, &MorlocError::Other(format!("{} undefined", $name)));
                return 0;
            }
        };
    }
    check_null!(nexus_path, "nexus path");
    check_null!(socket_basename, "socket basename");
    check_null!(call_packet_filename, "call packet filename");
    check_null!(result_cache_filename, "result cache filename");
    check_null!(output_filename, "slurm output filename");
    check_null!(error_filename, "slurm error filename");
    let res = &*resources;
    let nexus = CStr::from_ptr(nexus_path).to_string_lossy();
    let call = CStr::from_ptr(call_packet_filename).to_string_lossy();
    let socket = CStr::from_ptr(socket_basename).to_string_lossy();
    let result_cache = CStr::from_ptr(result_cache_filename).to_string_lossy();
    let output = CStr::from_ptr(output_filename).to_string_lossy();
    let error = CStr::from_ptr(error_filename).to_string_lossy();
    // NOTE(review): time_str_raw comes from CString::into_raw (see
    // write_slurm_time) but is released here with libc::free — allocators may
    // differ; should be CString::from_raw. Confirm before changing.
    let time_str_raw = write_slurm_time(res.time);
    let time_str = CStr::from_ptr(time_str_raw).to_string_lossy().into_owned();
    libc::free(time_str_raw as *mut c_void);
    let mem_arg = format!("--mem={}G", res.memory);
    let time_arg = format!("--time={}", time_str);
    let cpus_arg = format!("--cpus-per-task={}", res.cpus);
    let gpus_arg = format!("--gres=gpu:{}", res.gpus);
    // Shell-escape every user-controlled path before building the --wrap command.
    let esc_nexus = shell_escape(&nexus);
    let esc_call = shell_escape(&call);
    let esc_socket = shell_escape(&socket);
    let esc_result = shell_escape(&result_cache);
    let wrap_cmd = format!(
        "{} --call-packet {} --socket-base {} --output-file {} --output-form packet",
        esc_nexus, esc_call, esc_socket, esc_result
    );
    if wrap_cmd.len() >= MAX_SLURM_COMMAND_LENGTH {
        set_errmsg(errmsg, &MorlocError::Other("Wrap command too long".into()));
        return 0;
    }
    let wrap_arg = format!("--wrap={}", wrap_cmd);
    // Fork/exec sbatch
    let mut pipefd = [0i32; 2];
    if libc::pipe(pipefd.as_mut_ptr()) == -1 {
        set_errmsg(errmsg, &MorlocError::Other("Failed to create pipe for sbatch".into()));
        return 0;
    }
    let pid = libc::fork();
    if pid == -1 {
        libc::close(pipefd[0]);
        libc::close(pipefd[1]);
        set_errmsg(errmsg, &MorlocError::Other("Failed to fork for sbatch".into()));
        return 0;
    }
    if pid == 0 {
        // Child
        // Route child stdout into the pipe so the parent can read the job id
        // printed by `sbatch --parsable`.
        libc::close(pipefd[0]);
        libc::dup2(pipefd[1], libc::STDOUT_FILENO);
        libc::close(pipefd[1]);
        let sbatch = CString::new("sbatch").unwrap();
        let parsable = CString::new("--parsable").unwrap();
        let o_flag = CString::new("-o").unwrap();
        let e_flag = CString::new("-e").unwrap();
        let c_output = CString::new(output.as_ref()).unwrap();
        let c_error = CString::new(error.as_ref()).unwrap();
        let c_mem = CString::new(mem_arg).unwrap();
        let c_time = CString::new(time_arg).unwrap();
        let c_cpus = CString::new(cpus_arg).unwrap();
        let c_gpus = CString::new(gpus_arg).unwrap();
        let c_wrap = CString::new(wrap_arg).unwrap();
        libc::execlp(
            sbatch.as_ptr(),
            sbatch.as_ptr(),
            parsable.as_ptr(),
            o_flag.as_ptr(),
            c_output.as_ptr(),
            e_flag.as_ptr(),
            c_error.as_ptr(),
            c_mem.as_ptr(),
            c_time.as_ptr(),
            c_cpus.as_ptr(),
            c_gpus.as_ptr(),
            c_wrap.as_ptr(),
            ptr::null::(),
        );
        // Only reached if execlp failed.
        libc::_exit(127);
    }
    // Parent
    libc::close(pipefd[1]);
    let mut buf = [0u8; 64];
    // Read at most 63 bytes so the job-id text always fits the buffer.
    let nread = libc::read(pipefd[0], buf.as_mut_ptr() as *mut c_void, 63);
    libc::close(pipefd[0]);
    let mut status: i32 = 0;
    libc::waitpid(pid, &mut status, 0);
    if !libc::WIFEXITED(status) || libc::WEXITSTATUS(status) != 0 {
        set_errmsg(errmsg, &MorlocError::Other("sbatch exited with error".into()));
        return 0;
    }
    if nread <= 0 {
        set_errmsg(errmsg, &MorlocError::Other("Failed to read sbatch output".into()));
        return 0;
    }
    let output_str = std::str::from_utf8(&buf[..nread as usize]).unwrap_or("");
    match output_str.trim().parse::() {
        Ok(job_id) => job_id,
        Err(_) => {
            set_errmsg(errmsg, &MorlocError::Other("Failed to parse job ID from sbatch output".into()));
            0
        }
    }
}

// ── remote_call ──────────────────────────────────────────────────────────────

// Execute a morloc call remotely via SLURM, with content-addressed caching of
// arguments and result. Returns a malloc'd result packet or NULL with errmsg.
#[no_mangle]
pub unsafe extern "C" fn remote_call(
    midx: i32,
    socket_basename: *const c_char,
    cache_path: *const c_char,
    resources: *const Resources,
    arg_packets: *const *const u8,
    nargs: 
    usize,
    errmsg: *mut *mut c_char,
) -> *mut u8 {
    clear_errmsg(errmsg);
    // Use extern C declarations for functions from other modules
    extern "C" {
        fn read_schema_from_packet_meta(packet: *const u8, errmsg: *mut *mut c_char) -> *mut c_char;
        fn parse_schema(schema_str: *const c_char, errmsg: *mut *mut c_char) -> *mut crate::cschema::CSchema;
        fn free_schema(schema: *mut crate::cschema::CSchema);
        fn get_morloc_data_packet_value(data: *const u8, schema: *const crate::cschema::CSchema, errmsg: *mut *mut c_char) -> *mut u8;
        fn hash_voidstar(data: *const u8, schema: *const crate::cschema::CSchema, seed: u64, hash: *mut u64, errmsg: *mut *mut c_char) -> bool;
        fn mix(a: u64, b: u64) -> u64;
        fn mkdir_p(path: *const c_char, errmsg: *mut *mut c_char) -> i32;
        fn check_cache_packet(key: u64, cache_path: *const c_char, errmsg: *mut *mut c_char) -> *mut c_char;
        fn get_cache_packet(key: u64, cache_path: *const c_char, errmsg: *mut *mut c_char) -> *mut u8;
        fn put_cache_packet(data: *const u8, schema: *const crate::cschema::CSchema, key: u64, cache_path: *const c_char, errmsg: *mut *mut c_char) -> *mut c_char;
        fn make_cache_filename(hash: u64, cache_path: *const c_char, errmsg: *mut *mut c_char) -> *mut c_char;
        fn make_cache_filename_ext(hash: u64, cache_path: *const c_char, ext: *const c_char, errmsg: *mut *mut c_char) -> *mut c_char;
        fn make_morloc_remote_call_packet(midx: u32, arg_packets: *const *const u8, nargs: usize, errmsg: *mut *mut c_char) -> *mut u8;
        fn morloc_packet_size(packet: *const u8, errmsg: *mut *mut c_char) -> usize;
        fn read_binary_file(filename: *const c_char, file_size: *mut usize, errmsg: *mut *mut c_char) -> *mut u8;
        fn write_atomic(filename: *const c_char, data: *const u8, size: usize, errmsg: *mut *mut c_char) -> i32;
        fn get_morloc_data_packet_error_message(data: *const u8, errmsg: *mut *mut c_char) -> *mut c_char;
    }
    let seed = midx as u64;
    let mut err: *mut c_char = ptr::null_mut();
    // Cleanup tracking
    // These vectors are released by goto_cleanup! on error and by the trailing
    // cleanup loop on success; goto_cleanup! emulates the old C goto pattern.
    // NOTE(review): `Vec =` below lost its element-type parameter in extraction.
    let mut arg_hashes: Vec = vec![0; nargs];
    let mut arg_voidstars: Vec<*mut u8> = vec![ptr::null_mut(); nargs];
    let mut arg_schemas: Vec<*mut crate::cschema::CSchema> = vec![ptr::null_mut(); nargs];
    let mut cached_arg_filenames: Vec<*mut c_char> = vec![ptr::null_mut(); nargs];
    let mut cached_arg_packets: Vec<*mut u8> = vec![ptr::null_mut(); nargs];
    // The cache key for the call is the module index mixed with every
    // argument's content hash, so identical calls hit the same cache entry.
    let mut function_hash = mix(seed, DEFAULT_XXHASH_SEED);
    // Hash each argument
    for i in 0..nargs {
        let schema_str = read_schema_from_packet_meta(*arg_packets.add(i), &mut err);
        if schema_str.is_null() || !err.is_null() {
            goto_cleanup!(errmsg, err, arg_schemas, cached_arg_filenames, cached_arg_packets, return_packet);
        }
        arg_schemas[i] = parse_schema(schema_str, &mut err);
        if !err.is_null() {
            goto_cleanup!(errmsg, err, arg_schemas, cached_arg_filenames, cached_arg_packets, return_packet);
        }
        arg_voidstars[i] = get_morloc_data_packet_value(*arg_packets.add(i), arg_schemas[i], &mut err);
        if !err.is_null() {
            goto_cleanup!(errmsg, err, arg_schemas, cached_arg_filenames, cached_arg_packets, return_packet);
        }
        let mut h: u64 = 0;
        hash_voidstar(arg_voidstars[i], arg_schemas[i], DEFAULT_XXHASH_SEED, &mut h, &mut err);
        if !err.is_null() {
            goto_cleanup!(errmsg, err, arg_schemas, cached_arg_filenames, cached_arg_packets, return_packet);
        }
        arg_hashes[i] = h;
        function_hash = mix(function_hash, h);
    }
    mkdir_p(cache_path, &mut err);
    if !err.is_null() {
        goto_cleanup!(errmsg, err, arg_schemas, cached_arg_filenames, cached_arg_packets, return_packet);
    }
    // Check if result is cached
    let mut result_cache_filename = check_cache_packet(function_hash, cache_path, &mut err);
    // A cache miss may surface as an error here; swallow it and proceed.
    if !err.is_null() {
        libc::free(err as *mut c_void);
        err = ptr::null_mut();
    }
    if !result_cache_filename.is_null() {
        // Cache hit: return the stored result packet directly.
        return_packet = get_cache_packet(function_hash, cache_path, &mut err);
        if !err.is_null() {
            goto_cleanup!(errmsg, err, arg_schemas, cached_arg_filenames, cached_arg_packets, return_packet);
        }
    } else {
        result_cache_filename = make_cache_filename(function_hash, cache_path, &mut err);
        if !err.is_null() {
            goto_cleanup!(errmsg, err, arg_schemas, cached_arg_filenames, cached_arg_packets, return_packet);
        }
        // Cache arguments
        for i in 0..nargs {
            cached_arg_filenames[i] = check_cache_packet(arg_hashes[i], cache_path, &mut err);
            if cached_arg_filenames[i].is_null() {
                if !err.is_null() {
                    libc::free(err as *mut c_void);
                    err = ptr::null_mut();
                }
                cached_arg_filenames[i] = put_cache_packet(arg_voidstars[i], arg_schemas[i], arg_hashes[i], cache_path, &mut err);
                if !err.is_null() {
                    goto_cleanup!(errmsg, err, arg_schemas, cached_arg_filenames, cached_arg_packets, return_packet);
                }
            }
        }
        // Read cached arg packets
        for i in 0..nargs {
            let mut file_size: usize = 0;
            cached_arg_packets[i] = read_binary_file(cached_arg_filenames[i], &mut file_size, &mut err);
            if !err.is_null() {
                goto_cleanup!(errmsg, err, arg_schemas, cached_arg_filenames, cached_arg_packets, return_packet);
            }
        }
        // Build call packet
        let cached_ptrs: Vec<*const u8> = cached_arg_packets.iter().map(|p| *p as *const u8).collect();
        let call_packet = make_morloc_remote_call_packet(midx as u32, cached_ptrs.as_ptr(), nargs, &mut err);
        if !err.is_null() {
            libc::free(call_packet as *mut c_void);
            goto_cleanup!(errmsg, err, arg_schemas, cached_arg_filenames, cached_arg_packets, return_packet);
        }
        let call_packet_size = morloc_packet_size(call_packet, &mut err);
        // Hash call packet with xxhash
        let call_packet_hash = crate::hash::xxh64_with_seed(std::slice::from_raw_parts(call_packet, call_packet_size), DEFAULT_XXHASH_SEED);
        let call_ext = CString::new("-call.dat").unwrap();
        let call_packet_filename = make_cache_filename_ext(call_packet_hash, cache_path, call_ext.as_ptr(), &mut err);
        // Write call packet to disk
        write_atomic(call_packet_filename, call_packet, call_packet_size, &mut err);
        libc::free(call_packet as *mut c_void);
        let out_ext = CString::new(".out").unwrap();
        let err_ext = CString::new(".err").unwrap();
        let output_filename = make_cache_filename_ext(function_hash, cache_path, out_ext.as_ptr(), &mut err);
        let error_filename = make_cache_filename_ext(function_hash, cache_path, err_ext.as_ptr(), &mut err);
        // Submit SLURM job
        let nexus_c = CString::new("./nexus").unwrap();
        let pid = submit_morloc_slurm_job(
            nexus_c.as_ptr(),
            socket_basename,
            call_packet_filename,
            result_cache_filename,
            output_filename,
            error_filename,
            resources,
            &mut err,
        );
        libc::free(call_packet_filename as *mut c_void);
        libc::free(output_filename as *mut c_void);
        libc::free(error_filename as *mut c_void);
        if !err.is_null() {
            goto_cleanup!(errmsg, err, arg_schemas, cached_arg_filenames, cached_arg_packets, return_packet);
        }
        // Wait for job completion
        // NOTE(review): this polls sacct once per second with no timeout; a job
        // that never reaches a terminal state blocks forever.
        while !slurm_job_is_complete(pid) {
            libc::sleep(1);
        }
        let mut return_packet_size: usize = 0;
        return_packet = read_binary_file(result_cache_filename, &mut return_packet_size, &mut err);
        // If the result packet encodes a failure, drop it from the cache so a
        // later retry re-runs the job instead of replaying the failure.
        let failure = get_morloc_data_packet_error_message(return_packet, &mut err);
        if !failure.is_null() {
            libc::fprintf(
                libc::fdopen(libc::STDERR_FILENO, b"w\0".as_ptr() as *const c_char),
                b"Failed, deleting result %s\n\0".as_ptr() as *const c_char,
                result_cache_filename,
            );
            libc::unlink(result_cache_filename);
            libc::free(failure as *mut c_void);
        }
    }
    // Cleanup
    for i in 0..nargs {
        if !arg_schemas[i].is_null() {
            free_schema(arg_schemas[i]);
        }
        if !cached_arg_filenames[i].is_null() {
            libc::free(cached_arg_filenames[i] as *mut c_void);
        }
        if !cached_arg_packets[i].is_null() {
            libc::free(cached_arg_packets[i] as *mut c_void);
        }
    }
    if !result_cache_filename.is_null() {
        libc::free(result_cache_filename as *mut c_void);
    }
    return_packet
}

// Cleanup macro for goto-like pattern
macro_rules! 
goto_cleanup { ($errmsg:expr, $err:expr, $schemas:expr, $filenames:expr, $packets:expr, $return_packet:expr) => {{ *$errmsg = $err; for i in 0..$schemas.len() { if !$schemas[i].is_null() { extern "C" { fn free_schema(s: *mut crate::cschema::CSchema); } free_schema($schemas[i]); } if !$filenames[i].is_null() { libc::free($filenames[i] as *mut c_void); } if !$packets[i].is_null() { libc::free($packets[i] as *mut c_void); } } return $return_packet; }}; } use goto_cleanup; ================================================ FILE: data/rust/morloc-runtime/src/utility.rs ================================================ //! File I/O and string utility functions. //! Replaces utility.c. use std::ffi::{c_char, c_void, CStr}; use std::io::Write; use std::ptr; use crate::error::{clear_errmsg, set_errmsg, MorlocError}; // ── Cross-platform helpers ───────────────────────────────────────────────── /// Return the current errno value (cross-platform). #[cfg(target_os = "linux")] #[inline] pub unsafe fn errno_val() -> i32 { *libc::__errno_location() } #[cfg(target_os = "macos")] #[inline] pub unsafe fn errno_val() -> i32 { *libc::__error() } /// Suppress SIGPIPE on send(). Linux: per-call flag. macOS: use set_nosigpipe() on the socket. #[cfg(target_os = "linux")] pub const SEND_NOSIGNAL: i32 = libc::MSG_NOSIGNAL; #[cfg(target_os = "macos")] pub const SEND_NOSIGNAL: i32 = 0; /// Set SO_NOSIGPIPE on a socket (macOS). No-op on Linux (uses MSG_NOSIGNAL per-call). 
#[allow(unused_variables)]
pub unsafe fn set_nosigpipe(fd: i32) {
    #[cfg(target_os = "macos")]
    {
        let val: libc::c_int = 1;
        // Best effort: the setsockopt return value is deliberately ignored.
        libc::setsockopt(
            fd,
            libc::SOL_SOCKET,
            libc::SO_NOSIGPIPE,
            &val as *const _ as *const libc::c_void,
            std::mem::size_of::() as libc::socklen_t,
        );
    }
}

// ── File operations ────────────────────────────────────────────────────────

// True if the path names an existing filesystem entry; false for NULL input.
#[no_mangle]
pub unsafe extern "C" fn file_exists(filename: *const c_char) -> bool {
    if filename.is_null() {
        return false;
    }
    let path = CStr::from_ptr(filename).to_string_lossy();
    std::path::Path::new(path.as_ref()).exists()
}

// mkdir -p equivalent: create the directory and all missing parents.
// Returns 0 on success, -1 with errmsg set on failure.
#[no_mangle]
pub unsafe extern "C" fn mkdir_p(path: *const c_char, errmsg: *mut *mut c_char) -> i32 {
    clear_errmsg(errmsg);
    if path.is_null() {
        set_errmsg(errmsg, &MorlocError::Other("NULL path".into()));
        return -1;
    }
    let p = CStr::from_ptr(path).to_string_lossy();
    match std::fs::create_dir_all(p.as_ref()) {
        Ok(_) => 0,
        Err(e) => {
            set_errmsg(
                errmsg,
                &MorlocError::Io(e),
            );
            -1
        }
    }
}

// Recursively delete a directory; errors are deliberately ignored (best effort).
#[no_mangle]
pub unsafe extern "C" fn delete_directory(path: *const c_char) {
    if path.is_null() {
        return;
    }
    let p = CStr::from_ptr(path).to_string_lossy();
    let _ = std::fs::remove_dir_all(p.as_ref());
}

// True if C string `x` ends with C string `suffix`; false if either is NULL.
#[no_mangle]
pub unsafe extern "C" fn has_suffix(x: *const c_char, suffix: *const c_char) -> bool {
    if x.is_null() || suffix.is_null() {
        return false;
    }
    let xs = CStr::from_ptr(x).to_string_lossy();
    let ss = CStr::from_ptr(suffix).to_string_lossy();
    xs.ends_with(ss.as_ref())
}

// Atomically replace `filename` with `size` bytes from `data`: write to a
// temp file in the same directory, fsync, then rename over the target.
// Returns 0 on success, -1 with errmsg set on failure.
#[no_mangle]
pub unsafe extern "C" fn write_atomic(
    filename: *const c_char,
    data: *const u8,
    size: usize,
    errmsg: *mut *mut c_char,
) -> i32 {
    clear_errmsg(errmsg);
    if filename.is_null() || (data.is_null() && size != 0) {
        set_errmsg(errmsg, &MorlocError::Other("invalid arguments".into()));
        return -1;
    }
    let path_str = CStr::from_ptr(filename).to_string_lossy();
    let path = std::path::Path::new(path_str.as_ref());
    // Get parent directory
    let dir = path.parent().unwrap_or(std::path::Path::new("."));
    // Create temp file in same directory
    // NOTE(review): the temp name is keyed only on process id, so two
    // concurrent write_atomic calls in the same process on the same directory
    // would collide — confirm callers never do that.
    let tmp_path = dir.join(format!("morloc-tmp_{}", std::process::id()));
    let result = (|| -> Result<(), std::io::Error> {
        // Write to temp file
        let mut f = std::fs::File::create(&tmp_path)?;
        if size > 0 {
            let bytes = std::slice::from_raw_parts(data, size);
            f.write_all(bytes)?;
        }
        f.sync_all()?;
        drop(f);
        // Atomic rename
        std::fs::rename(&tmp_path, path)?;
        // Sync parent directory
        if let Ok(dir_f) = std::fs::File::open(dir) {
            let _ = dir_f.sync_all();
        }
        Ok(())
    })();
    match result {
        Ok(_) => 0,
        Err(e) => {
            let _ = std::fs::remove_file(&tmp_path);
            set_errmsg(errmsg, &MorlocError::Io(e));
            -1
        }
    }
}

// ── Binary I/O ─────────────────────────────────────────────────────────────

// Read an entire file into a libc::malloc'd buffer (caller frees with free()).
// `file_size` receives the byte count; returns NULL with errmsg on failure.
#[no_mangle]
pub unsafe extern "C" fn read_binary_file(
    filename: *const c_char,
    file_size: *mut usize,
    errmsg: *mut *mut c_char,
) -> *mut u8 {
    clear_errmsg(errmsg);
    if filename.is_null() {
        set_errmsg(errmsg, &MorlocError::Other("NULL filename".into()));
        return ptr::null_mut();
    }
    let path = CStr::from_ptr(filename).to_string_lossy();
    match std::fs::read(path.as_ref()) {
        Ok(data) => {
            *file_size = data.len();
            // NOTE(review): malloc(0) may return NULL for an empty file, which
            // would be reported as "malloc failed" — verify intent.
            let buf = libc::malloc(data.len()) as *mut u8;
            if buf.is_null() {
                set_errmsg(errmsg, &MorlocError::Other("malloc failed".into()));
                return ptr::null_mut();
            }
            std::ptr::copy_nonoverlapping(data.as_ptr(), buf, data.len());
            buf
        }
        Err(e) => {
            set_errmsg(errmsg, &MorlocError::Io(e));
            ptr::null_mut()
        }
    }
}

// Read the remainder of an open FILE* into a libc::malloc'd buffer. Seekable
// streams are sized via fseek/ftell; non-seekable streams fall back to a
// chunked streaming read.
#[no_mangle]
pub unsafe extern "C" fn read_binary_fd(
    file: *mut libc::FILE,
    file_size: *mut usize,
    errmsg: *mut *mut c_char,
) -> *mut u8 {
    clear_errmsg(errmsg);
    if file.is_null() {
        set_errmsg(errmsg, &MorlocError::Other("NULL file".into()));
        return ptr::null_mut();
    }
    // Try seek-based size detection
    if libc::fseek(file, 0, libc::SEEK_END) == 0 {
        let size = libc::ftell(file) as usize;
        if size > 0 {
            libc::rewind(file);
            let buf = libc::malloc(size) as *mut u8;
            if buf.is_null() {
                set_errmsg(errmsg, &MorlocError::Other("malloc failed".into()));
                return ptr::null_mut();
            }
            let read = libc::fread(buf as *mut c_void, 1, 
            size, file);
            if read == size {
                *file_size = size;
                return buf;
            }
            // Short read despite the reported size: discard and fall through
            // to the streaming path below.
            libc::free(buf as *mut c_void);
        }
    }
    // Streaming read for non-seekable files
    let chunk_size: usize = 0xffff;
    let mut buf: *mut u8 = ptr::null_mut();
    let mut allocated: usize = 0;
    loop {
        // Grow by one chunk per iteration; realloc(NULL, n) acts as malloc.
        let new_buf = libc::realloc(buf as *mut c_void, allocated + chunk_size) as *mut u8;
        if new_buf.is_null() {
            libc::free(buf as *mut c_void);
            set_errmsg(errmsg, &MorlocError::Other("realloc failed".into()));
            return ptr::null_mut();
        }
        buf = new_buf;
        let read = libc::fread(buf.add(allocated) as *mut c_void, 1, chunk_size, file);
        allocated += read;
        if read < chunk_size {
            if libc::feof(file) != 0 {
                *file_size = allocated;
                return buf;
            }
            if libc::ferror(file) != 0 {
                libc::free(buf as *mut c_void);
                set_errmsg(errmsg, &MorlocError::Other("read error".into()));
                return ptr::null_mut();
            }
        }
    }
}

// Write exactly `count` bytes to `fd`, retrying on short writes.
// Returns 0 on success, -1 with errmsg on a write error.
#[no_mangle]
pub unsafe extern "C" fn write_binary_fd(
    fd: i32,
    buf: *const c_char,
    count: usize,
    errmsg: *mut *mut c_char,
) -> i32 {
    clear_errmsg(errmsg);
    let mut total: usize = 0;
    while total < count {
        let written = libc::write(fd, buf.add(total) as *const c_void, count - total);
        if written < 0 {
            set_errmsg(
                errmsg,
                &MorlocError::Other(format!("write failed: {}", std::io::Error::last_os_error())),
            );
            return -1;
        }
        total += written as usize;
    }
    0
}

// Convenience wrapper: write `count` bytes to stdout.
#[no_mangle]
pub unsafe extern "C" fn print_binary(
    buf: *const c_char,
    count: usize,
    errmsg: *mut *mut c_char,
) -> i32 {
    write_binary_fd(libc::STDOUT_FILENO, buf, count, errmsg)
}

// ── Display ────────────────────────────────────────────────────────────────

// Debug helper: dump `size` bytes as hex to stderr, extra gap every 8 bytes.
#[no_mangle]
pub unsafe extern "C" fn hex(ptr: *const c_void, size: usize) {
    if ptr.is_null() || size == 0 {
        return;
    }
    let bytes = std::slice::from_raw_parts(ptr as *const u8, size);
    for (i, b) in bytes.iter().enumerate() {
        if i > 0 && i % 8 == 0 {
            eprint!(" ");
        }
        eprint!("{:02X}", b);
        if i < size - 1 {
            eprint!(" ");
        }
    }
}

// Hex dump to stdout: 4-byte groups, 24 bytes per line, trailing newline.
#[no_mangle]
pub unsafe extern "C" fn print_hex_dump(
    data: *const u8,
    size: usize,
    errmsg: *mut *mut c_char,
) -> bool {
    clear_errmsg(errmsg);
    if data.is_null() && size > 0 {
        set_errmsg(errmsg, &MorlocError::Other("NULL data".into()));
        return false;
    }
    let bytes = if size > 0 { std::slice::from_raw_parts(data, size) } else { &[] };
    for (i, b) in bytes.iter().enumerate() {
        if i > 0 && i % 4 == 0 {
            if i % 24 == 0 {
                println!();
            } else {
                print!(" ");
            }
        }
        print!("{:02X}", b);
    }
    if !bytes.is_empty() {
        println!();
    }
    true
}

// ── xxHash wrapper and mix ─────────────────────────────────────────────────

/// Mix two 64-bit hash values. Matches the C implementation in cache.c.
// Multiply by the xxHash64 primes with a 31-bit rotate in between; must stay
// bit-identical to the C version so cache keys remain compatible.
#[no_mangle]
pub extern "C" fn mix(a: u64, b: u64) -> u64 {
    const PRIME64_1: u64 = 0x9E3779B185EBCA87;
    const PRIME64_2: u64 = 0xC2B2AE3D27D4EB4F;
    let mut a = a ^ b.wrapping_mul(PRIME64_1);
    a = (a << 31) | (a >> 33);
    a.wrapping_mul(PRIME64_2)
}

// C-callable xxHash64; NULL or empty input hashes as the empty byte string.
#[no_mangle]
pub unsafe extern "C" fn morloc_xxh64(
    input: *const c_void,
    length: usize,
    seed: u64,
) -> u64 {
    if input.is_null() || length == 0 {
        return crate::hash::xxh64_with_seed(&[], seed);
    }
    let data = std::slice::from_raw_parts(input as *const u8, length);
    crate::hash::xxh64_with_seed(data, seed)
}

// ── String utilities ───────────────────────────────────────────────────────

/// dirname - returns pointer into the input string (modifies it in-place)
/// Matches the C behavior: returns "." for empty/NULL, strips trailing slashes
#[no_mangle]
pub unsafe extern "C" fn dirname(path: *mut c_char) -> *mut c_char {
    // Return a pointer to the static string "." for empty/null paths and paths with no slash.
static DOT: [u8; 2] = [b'.', 0]; let dot_ptr = DOT.as_ptr() as *mut c_char; if path.is_null() || *path == 0 { return dot_ptr; } let len = libc::strlen(path); let mut end = path.add(len - 1); // Remove trailing slashes while end > path && *end == b'/' as c_char { *end = 0; end = end.sub(1); } // Find last slash let last_slash = libc::strrchr(path, b'/' as i32); if last_slash.is_null() { return dot_ptr; } if last_slash == path { *path.add(1) = 0; // root case "/" } else { *last_slash = 0; } path } ================================================ FILE: data/rust/morloc-runtime/src/voidstar.rs ================================================ //! Shared voidstar operations: relptr adjustment, binary serialization, //! schema-aware free, and flatten-to-buffer. //! //! These functions operate on the morloc voidstar binary format in SHM. //! They are used by packet.rs, cli.rs, and json.rs. use crate::error::MorlocError; use crate::schema::{Schema, SerialType}; use crate::shm::{self, AbsPtr, Array, RelPtr, Tensor}; // ── adjust_voidstar_relptrs ──────────────────────────────────────────────── /// Adjust all relptrs in a voidstar blob by adding base_rel. /// Used after copying a flattened blob into SHM. pub fn adjust_relptrs( data: AbsPtr, schema: &Schema, base_rel: RelPtr, ) -> Result<(), MorlocError> { // SAFETY: data points to a voidstar blob in SHM. We adjust relptrs in-place; // all pointer arithmetic stays within the blob's bounds as defined by schema. 
    unsafe {
        match schema.serial_type {
            SerialType::String | SerialType::Array => {
                // Shift the array's own data pointer, then recurse into each
                // element only if elements themselves contain relptrs.
                let arr = &mut *(data as *mut Array);
                arr.data += base_rel;
                if !schema.parameters.is_empty() && !schema.parameters[0].is_fixed_width() {
                    let arr_data = shm::rel2abs(arr.data)?;
                    let w = schema.parameters[0].width;
                    for i in 0..arr.size {
                        adjust_relptrs(arr_data.add(i * w), &schema.parameters[0], base_rel)?;
                    }
                }
            }
            SerialType::Tuple | SerialType::Map => {
                // Recurse into each field at its schema-defined offset.
                for i in 0..schema.parameters.len() {
                    adjust_relptrs(data.add(schema.offsets[i]), &schema.parameters[i], base_rel)?;
                }
            }
            SerialType::Optional => {
                // First byte is the presence tag; payload follows at the first
                // offset (or the aligned position after the tag as a fallback).
                if *data != 0 && !schema.parameters.is_empty() {
                    let off = schema.offsets.first().copied()
                        .unwrap_or_else(|| shm::align_up(1, schema.parameters[0].alignment().max(1)));
                    adjust_relptrs(data.add(off), &schema.parameters[0], base_rel)?;
                }
            }
            SerialType::Tensor => {
                let t = &mut *(data as *mut Tensor);
                if t.total_elements > 0 {
                    t.shape += base_rel;
                    t.data += base_rel;
                }
            }
            _ => {}
        }
    }
    Ok(())
}

// ── read_voidstar_binary ───────────────────────────────────────────────────

/// Read a flat voidstar binary blob into SHM, adjusting relptrs.
// NOTE(review): the return type below lost its generic parameters in
// extraction (`Result {`); tokens preserved as found.
pub fn read_binary(blob: &[u8], schema: &Schema) -> Result {
    let base = shm::shmalloc(blob.len())?;
    // SAFETY: base is freshly allocated with blob.len() bytes.
    unsafe { std::ptr::copy_nonoverlapping(blob.as_ptr(), base, blob.len()) };
    // Relptrs in a flat blob are relative to position 0; rebase them onto the
    // blob's actual location in the pool.
    let base_rel = shm::abs2rel(base)?;
    adjust_relptrs(base, schema, base_rel)?;
    Ok(base)
}

// ── shfree_by_schema ───────────────────────────────────────────────────────

/// Zero metadata for nested structures so the parent block can be cleanly freed.
/// Does NOT call shfree on sub-pointers (they're cursor-packed in the same block).
pub fn free_by_schema(ptr: AbsPtr, schema: &Schema) -> Result<(), MorlocError> {
    // SAFETY: ptr points to voidstar data in SHM with layout described by schema.
    // We zero metadata at schema.width offsets within the structure.
    unsafe {
        match schema.serial_type {
            SerialType::String | SerialType::Array => {
                let arr = &*(ptr as *const Array);
                if arr.data > 0 && !schema.parameters.is_empty() && !schema.parameters[0].is_fixed_width() {
                    let arr_data = shm::rel2abs(arr.data)?;
                    let w = schema.parameters[0].width;
                    for i in 0..arr.size {
                        free_by_schema(arr_data.add(i * w), &schema.parameters[0])?;
                    }
                }
            }
            SerialType::Tuple | SerialType::Map => {
                for i in 0..schema.parameters.len() {
                    free_by_schema(ptr.add(schema.offsets[i]), &schema.parameters[i])?;
                }
            }
            SerialType::Tensor => {} // inline, freed by parent
            _ => {}
        }
        // Zero this node's own metadata last, after children were visited.
        std::ptr::write_bytes(ptr, 0, schema.width);
    }
    Ok(())
}

// ── flatten_voidstar_to_buffer ─────────────────────────────────────────────

/// Flatten a voidstar structure in SHM into a self-contained byte buffer.
/// Relptrs in the output are offsets from position 0 of the buffer.
// NOTE(review): the return type below lost its generic parameters in
// extraction (`Result, MorlocError>`); tokens preserved as found.
pub fn flatten_to_buffer(data: AbsPtr, schema: &Schema) -> Result, MorlocError> {
    let total = crate::ffi::calc_voidstar_size_inner(data, schema)?;
    let mut buf = vec![0u8; total];
    // Phase 1: copy the fixed-width root record verbatim.
    // SAFETY: data points to at least schema.width bytes in SHM; buf has total >= schema.width bytes.
    unsafe { std::ptr::copy_nonoverlapping(data, buf.as_mut_ptr(), schema.width) };
    // Phase 2: fix up relptrs and copy variable-length data
    let mut cursor = schema.width;
    flatten_fixup(&mut buf, 0, data, schema, &mut cursor)?;
    Ok(buf)
}

// Recursive worker for flatten_to_buffer: rewrites the relptrs inside buf at
// buf_offset and appends the pointed-to variable-length payloads at *cursor.
fn flatten_fixup(
    buf: &mut [u8],
    buf_offset: usize,
    data: AbsPtr,
    schema: &Schema,
    cursor: &mut usize,
) -> Result<(), MorlocError> {
    // SAFETY: buf is sized by calc_voidstar_size_inner to hold the entire flattened structure.
    // data points to corresponding SHM data. cursor tracks write position within buf.
    unsafe {
        match schema.serial_type {
            SerialType::String | SerialType::Array => {
                let orig_arr = &*(data as *const Array);
                let buf_arr = &mut *(buf.as_mut_ptr().add(buf_offset) as *mut Array);
                if orig_arr.size == 0 {
                    buf_arr.data = 0;
                    return Ok(());
                }
                let orig_data = shm::rel2abs(orig_arr.data)?;
                let elem_schema = &schema.parameters[0];
                // Append the element block at the next aligned cursor position
                // and point the flattened array at it (buffer-relative offset).
                let align = elem_schema.alignment();
                *cursor = shm::align_up(*cursor, align);
                buf_arr.data = *cursor as RelPtr;
                let elem_w = elem_schema.width;
                let total_bytes = elem_w * orig_arr.size;
                buf[*cursor..*cursor + total_bytes].copy_from_slice(
                    std::slice::from_raw_parts(orig_data, total_bytes)
                );
                let elem_start = *cursor;
                *cursor += total_bytes;
                // Variable-width elements still hold SHM relptrs; fix each up.
                if !elem_schema.is_fixed_width() {
                    for i in 0..orig_arr.size {
                        flatten_fixup(
                            buf,
                            elem_start + i * elem_w,
                            orig_data.add(i * elem_w),
                            elem_schema,
                            cursor,
                        )?;
                    }
                }
            }
            SerialType::Tuple | SerialType::Map => {
                for i in 0..schema.parameters.len() {
                    flatten_fixup(
                        buf,
                        buf_offset + schema.offsets[i],
                        data.add(schema.offsets[i]),
                        &schema.parameters[i],
                        cursor,
                    )?;
                }
            }
            SerialType::Optional => {
                // Presence tag was already copied by the parent; only recurse
                // into the payload when it is present.
                let tag = *buf.as_ptr().add(buf_offset);
                if tag != 0 && !schema.parameters.is_empty() {
                    let off = schema.offsets.first().copied()
                        .unwrap_or_else(|| shm::align_up(1, schema.parameters[0].alignment().max(1)));
                    flatten_fixup(
                        buf,
                        buf_offset + off,
                        data.add(off),
                        &schema.parameters[0],
                        cursor,
                    )?;
                }
            }
            SerialType::Tensor => {
                let orig = &*(data as *const Tensor);
                let buf_t = &mut *(buf.as_mut_ptr().add(buf_offset) as *mut Tensor);
                if orig.total_elements == 0 {
                    buf_t.shape = 0;
                    buf_t.data = 0;
                    return Ok(());
                }
                // First append the shape vector (ndim entries), then the
                // element data, each at its own alignment.
                let ndim = schema.offsets.first().copied().unwrap_or(0);
                let orig_shape = shm::rel2abs(orig.shape)?;
                *cursor = shm::align_up(*cursor, std::mem::align_of::());
                buf_t.shape = *cursor as RelPtr;
                let shape_bytes = ndim * std::mem::size_of::();
                buf[*cursor..*cursor + shape_bytes].copy_from_slice(
                    std::slice::from_raw_parts(orig_shape, shape_bytes)
                );
                *cursor += shape_bytes;
                let orig_data = shm::rel2abs(orig.data)?;
                let elem_w = schema.parameters[0].width;
                let elem_align = schema.parameters[0].alignment();
                *cursor = shm::align_up(*cursor, elem_align);
                buf_t.data = *cursor as RelPtr;
                let data_bytes = orig.total_elements * elem_w;
                buf[*cursor..*cursor + data_bytes].copy_from_slice(
                    std::slice::from_raw_parts(orig_data, data_bytes)
                );
                *cursor += data_bytes;
            }
            _ => {} // primitives already copied by parent
        }
    }
    Ok(())
}

// ── write_voidstar_binary (to fd) ──────────────────────────────────────────

/// Flatten voidstar and write to a file descriptor. Returns bytes written.
// NOTE(review): the return type below lost its generic parameters in
// extraction (`Result {`). Also note: a single libc::write may write fewer
// than buf.len() bytes; the short-write case is reported via the return
// count, not retried.
pub fn write_binary_to_fd(fd: i32, data: AbsPtr, schema: &Schema) -> Result {
    let buf = flatten_to_buffer(data, schema)?;
    // SAFETY: buf is a valid byte slice; fd is a valid file descriptor from the caller.
    let written = unsafe { libc::write(fd, buf.as_ptr() as *const std::ffi::c_void, buf.len()) };
    if written < 0 {
        return Err(MorlocError::Io(std::io::Error::last_os_error()));
    }
    Ok(written as usize)
}
================================================ FILE: exe/morloc-codegen-generic/Main.hs ================================================
{- | Module : Main Description : Generic pool code generator for morloc Copyright : (c) Zebulun Arendsee, 2016-2026 License : Apache-2.0 Standalone executable that assembles pool files for dynamically-typed interpreted languages. Receives a serialized IProgram via a binary file and a language descriptor via lang.yaml. 
Usage: morloc-codegen-generic <lang.yaml> <iprogram.bin>

Reads:
  - argv[1]: path to lang.yaml (language descriptor)
  - argv[2]: path to binary-encoded IProgram

Writes to stdout:
  - JSON CodegenManifest with pool_code and build_commands
-}
module Main (main) where

import qualified Data.Aeson as Aeson
import qualified Data.Binary as Binary
import qualified Data.ByteString.Lazy as BL
import qualified Data.Text as T
import qualified Data.Text.IO as TIO
import GHC.IO.Encoding (setLocaleEncoding, utf8)
import System.Environment (getArgs)
import System.Exit (exitFailure)
-- NOTE(review): the (</>) operator was lost in extraction (stripped as an
-- HTML-like tag); restored here and in 'run' below — confirm against upstream.
import System.FilePath (takeDirectory, (</>))
import System.IO (hPutStrLn, stderr)

import Morloc.CodeGenerator.Grammars.Translator.Generic
  ( CodegenManifest (..)
  , printProgram
  )
import Morloc.CodeGenerator.Grammars.Translator.Imperative (IProgram)
import Morloc.CodeGenerator.LanguageDescriptor
  ( LangDescriptor (..)
  , loadLangDescriptor
  )
import Morloc.Data.Doc (render)

-- | Entry point: expect exactly two arguments (lang.yaml path, IProgram path)
-- and run the generator; print usage to stderr and fail otherwise.
main :: IO ()
main = do
  setLocaleEncoding utf8
  args <- getArgs
  case args of
    [langYamlPath, iprogramPath] -> run langYamlPath iprogramPath
    _ -> do
      hPutStrLn stderr "Usage: morloc-codegen-generic <lang.yaml> <iprogram.bin>"
      exitFailure

-- | Load the language descriptor and binary IProgram, assemble the pool
-- source with 'printProgram', and emit the 'CodegenManifest' as JSON on
-- stdout.
run :: FilePath -> FilePath -> IO ()
run langYamlPath iprogramPath = do
  -- load language descriptor
  descResult <- loadLangDescriptor langYamlPath
  desc <- case descResult of
    Left err -> do
      hPutStrLn stderr $ "Failed to load " ++ langYamlPath ++ ": " ++ err
      exitFailure
    Right d -> return d
  -- load pool template from disk if not inline
  desc' <-
    if T.null (ldPoolTemplate desc)
      then do
        let langDir = takeDirectory langYamlPath
            ext = ldExtension desc
            -- NOTE(review): path-combine operator reconstructed as (</>);
            -- both (</>) and (++) are infixr 5, so this parses as
            -- langDir </> ("pool." ++ ext) — confirm against upstream.
            poolPath = langDir </> "pool." ++ ext
        poolText <- TIO.readFile poolPath
        return desc {ldPoolTemplate = poolText}
      else return desc
  -- deserialize IProgram
  binaryData <- BL.readFile iprogramPath
  let program = Binary.decode binaryData :: IProgram
  -- assemble pool file
  let poolCode = render (printProgram desc' program)
  -- output manifest as JSON
  let manifest =
        CodegenManifest
          { cgmPoolCode = poolCode
          , cgmBuildCommands = []
          }
  BL.putStr (Aeson.encode manifest)



================================================
FILE: executable/CppPrinter.hs
================================================
{-# LANGUAGE OverloadedStrings #-}
{-# LANGUAGE QuasiQuotes #-}
{-# LANGUAGE TemplateHaskell #-}

{- | Module      : CppPrinter
Description : Pretty-print the imperative IR as C++ source code
Copyright   : (c) Zebulun Arendsee, 2016-2026
License     : Apache-2.0
Maintainer  : z@morloc.io

Converts 'IStmt' and 'IExpr' IR nodes into C++ source text. Handles type
rendering, struct definitions, forward declarations, and C++ idioms
(templates, shared_ptr, std::variant).
-}
module CppPrinter
  ( printExpr
  , printStmt
  , printStmts
    -- * Pool-level rendering
  , printDispatch
  , printProgram
    -- * Struct/serializer rendering
  , printStructTypedef
  , printSerializer
  , printDeserializer
  , printTemplateHeader
  , printRecordTemplate
  ) where

import Morloc.CodeGenerator.Grammars.Common (DispatchEntry (..), manNamer)
import Morloc.CodeGenerator.Grammars.Translator.Imperative
import Morloc.CodeGenerator.Namespace (MDoc)
import Morloc.Data.Doc
import Morloc.DataFiles as DF
import Morloc.Quasi

-- | Render a single 'IExpr' IR node as a C++ expression document.
printExpr :: IExpr -> MDoc
printExpr (IVar v) = pretty v
printExpr (IBoolLit True) = "true"
printExpr (IBoolLit False) = "false"
printExpr (INullLit (Just t)) = "std::optional<" <> renderIType t <> ">()"
printExpr (INullLit Nothing) = "std::nullopt"
printExpr (IIntLit Nothing i) = viaShow i
-- Non-default integer types are rendered through static_cast.
printExpr (IIntLit (Just t) i)
  | t == "int" = viaShow i
  | otherwise = "static_cast<" <> pretty t <> ">(" <> viaShow i <> ")"
printExpr (IRealLit Nothing r) = viaShow r
printExpr (IRealLit (Just t) r)
  | t == "double" = viaShow r
  | otherwise = "static_cast<" <> pretty t <> ">(" <> viaShow r <> ")"
printExpr (IStrLit s) = [idoc|std::string(#{textEsc' s})|]
printExpr (IListLit es) = encloseSep "{" "}" "," (map printExpr es)
printExpr (ITupleLit es) = "std::make_tuple" <> tupled (map printExpr es)
-- Records are constructed positionally with brace initialization.
printExpr (IRecordLit _ _ entries) = encloseSep "{" "}" "," (map (printExpr . snd) entries)
printExpr (IAccess e (IIdx i)) = "std::get<" <> pretty i <> ">(" <> printExpr e <> ")"
printExpr (IAccess e (IKey _)) = printExpr e -- should not be reached for C++
printExpr (IAccess e (IField f)) = printExpr e <> "." <> pretty f
printExpr (ISerCall schema e) = [idoc|_put_value(#{printExpr e}, "#{pretty schema}")|]
printExpr (IDesCall schema (Just rawtype) e) = [idoc|_get_value<#{renderIType rawtype}>(#{printExpr e}, "#{pretty schema}")|]
printExpr (IDesCall schema Nothing e) = [idoc|_get_value(#{printExpr e}, "#{pretty schema}")|]
printExpr (IPack packer e) = pretty packer <> parens (printExpr e)
-- Calls may carry explicit template arguments; argGroups supports curried
-- call chains rendered as consecutive argument tuples.
printExpr (ICall f Nothing argGroups) = pretty f <> hsep (map (tupled . map printExpr) argGroups)
printExpr (ICall f (Just ts) argGroups) =
  pretty f
    <> encloseSep "<" ">" "," (map renderIType ts)
    <> hsep (map (tupled . map printExpr) argGroups)
printExpr (IForeignCall _ _ _) = error "use IRawExpr for C++ foreign calls"
printExpr (IRemoteCall _ _ _ _) = error "use IRawExpr for C++ remote calls"
printExpr (ILambda args body) =
  "[&](" <> hsep (punctuate "," ["auto" <+> pretty a | a <- args])
    <> "){return "
    <> printExpr body
    <> ";}"
printExpr (IRawExpr d) = pretty d
printExpr (IDoBlock e) = "[&](){return " <> printExpr e <> ";}"
printExpr (IEval e) = printExpr e <> "()"
printExpr (IIntrinsicHash schema e) = [idoc|_mlc_hash(#{printExpr e}, "#{pretty schema}")|]
printExpr (IIntrinsicSave fmt schema e path)
  | fmt == "json" = [idoc|_mlc_save_json(#{printExpr e}, "#{pretty schema}", #{printExpr path})|]
  | fmt == "voidstar" = [idoc|_mlc_save_voidstar(#{printExpr e}, "#{pretty schema}", #{printExpr path})|]
  | otherwise = [idoc|_mlc_save(#{printExpr e}, "#{pretty schema}", #{printExpr path})|]
printExpr (IIntrinsicLoad schema (Just t) path) = [idoc|_mlc_load<#{renderIType t}>("#{pretty schema}", #{printExpr path})|]
printExpr (IIntrinsicLoad schema Nothing path) = [idoc|_mlc_load("#{pretty schema}", #{printExpr path})|]
printExpr (IIntrinsicShow schema e) = [idoc|_mlc_show(#{printExpr e}, "#{pretty schema}")|]
printExpr (IIntrinsicRead schema (Just t) e) = [idoc|_mlc_read<#{renderIType t}>("#{pretty schema}", #{printExpr e})|]
printExpr (IIntrinsicRead schema Nothing e) = [idoc|_mlc_read("#{pretty schema}", #{printExpr e})|]

-- | Render a single 'IStmt' IR node as a C++ statement document.
printStmt :: IStmt -> MDoc
printStmt (IAssign v Nothing e) = "auto" <+> pretty v <+> "=" <+> printExpr e <> ";"
printStmt (IAssign v (Just t) e) = renderIType t <+> pretty v <+> "=" <+> printExpr e <> ";"
-- C++ uses an indexed for loop with push_back
printStmt (IMapList resultVar resultType iterVar collection bodyStmts yieldExpr) =
  vsep
    [ resultDecl
    , block 4 [idoc|for(size_t #{pretty iterVar}_idx = 0; #{pretty iterVar}_idx < #{printExpr collection}.size(); #{pretty iterVar}_idx++)|]
        ( vsep
            ( [idoc|auto #{pretty iterVar} = #{printExpr collection}[#{pretty iterVar}_idx];|]
                : map printStmt bodyStmts
                ++ [[idoc|#{pretty resultVar}.push_back(#{printExpr yieldExpr});|]]
            )
        )
    ]
  where
    -- Declare the accumulator with the known type, or fall back to an
    -- auto-typed empty list literal.
    resultDecl = case resultType of
      Just t -> [idoc|#{renderIType t} #{pretty resultVar};|]
      Nothing -> printStmt (IAssign resultVar Nothing (IListLit []))
printStmt (IIf resultVar resultType condExpr thenStmts thenExpr elseStmts elseExpr) =
  vsep
    [ resultDecl
    , block 4 [idoc|if(#{printExpr condExpr})|]
        (vsep (map printStmt thenStmts ++ [[idoc|#{pretty resultVar} = #{printExpr thenExpr};|]]))
    , block 4 "else"
        (vsep (map printStmt elseStmts ++ [[idoc|#{pretty resultVar} = #{printExpr elseExpr};|]]))
    ]
  where
    resultDecl = case resultType of
      Just t -> [idoc|#{renderIType t} #{pretty resultVar};|]
      Nothing -> [idoc|auto #{pretty resultVar};|]
printStmt (IReturn e) = "return(" <> printExpr e <> ");"
printStmt (IExprStmt e) = printExpr e <> ";"
printStmt (IFunDef _ _ _ _) = error "IFunDef not yet implemented for C++ printer"

-- | Render a list of statements, one document per statement.
printStmts :: [IStmt] -> [MDoc]
printStmts = map printStmt

-- | Render C++ dispatch functions from structured dispatch entries.
printDispatch :: [DispatchEntry] -> [DispatchEntry] -> MDoc
printDispatch locals remotes =
  [idoc|uint8_t* local_dispatch(uint32_t mid, const uint8_t** args){
    switch(mid){
        #{align (vsep localCases)}
        default:
            std::ostringstream oss;
            oss << "Invalid local manifold id: " << mid;
            throw std::runtime_error(oss.str());
    }
}

uint8_t* remote_dispatch(uint32_t mid, const uint8_t** args){
    switch(mid){
        #{align (vsep remoteCases)}
        default:
            std::ostringstream oss;
            oss << "Invalid remote manifold id: " << mid;
            throw std::runtime_error(oss.str());
    }
}|]
  where
    localCases = map (makeCase "") locals
    -- remote workers use the "_remote" manifold name suffix
    remoteCases = map (makeCase "_remote") remotes

-- | Render one `case` arm calling the manifold function (optionally suffixed)
-- with the first n entries of the args array.
makeCase :: MDoc -> DispatchEntry -> MDoc
makeCase suffix (DispatchEntry i n) =
  "case" <+> pretty i <> ":" <+> "return" <+> manNamer i <> suffix
    <> tupled ["args[" <> pretty j <> "]" | j <- take n ([0 ..] :: [Int])]
    <> ";"

-- | Assemble a complete C++ pool file from an IProgram and C++-specific extras.
printProgram :: [MDoc] -> [MDoc] -> IProgram -> MDoc
printProgram serialization signatures prog =
  format
    (DF.embededFileText (DF.poolTemplate "cpp"))
    -- NOTE(review): this placeholder marker string may have been garbled by
    -- extraction (angle-bracket content stripped) — confirm against upstream.
    "// <<>>"
    [ vsep (map pretty (ipSources prog))
    , vsep serialization
    , vsep signatures
    , vsep (map pretty (ipManifolds prog))
    , printDispatch (ipLocalDispatch prog) (ipRemoteDispatch prog)
    ]

-- | Render a C++ `template<class T1, ...>` header; empty for no parameters.
printTemplateHeader :: [MDoc] -> MDoc
printTemplateHeader [] = ""
printTemplateHeader ts = "template" <+> encloseSep "<" ">" "," ["class" <+> t | t <- ts]

-- | Render a template argument list `<T1, ...>`; empty for no parameters.
printRecordTemplate :: [MDoc] -> MDoc
printRecordTemplate [] = ""
printRecordTemplate ts = encloseSep "<" ">" "," ts

-- | Render a C++ struct definition.
printStructTypedef ::
  [MDoc] -> -- template parameters (e.g., ["T"])
  MDoc -> -- the name of the structure (e.g., "Person")
  [(MDoc, MDoc)] -> -- key and type for all fields
  MDoc
printStructTypedef params rname fields = vsep [template, struct]
  where
    template = printTemplateHeader params
    struct =
      block 4 ("struct" <+> rname) (vsep [t <+> k <> ";" | (k, t) <- fields]) <> ";"

-- | Render a C++ serializer (toAnything) for a struct.
printSerializer ::
  [MDoc] -> -- template parameters
  MDoc -> -- type of thing being serialized
  [(MDoc, MDoc)] -> -- key and type for all fields
  MDoc
printSerializer params rtype fields =
  [idoc|
#{printTemplateHeader params}
void* toAnything(void* dest, void** cursor, const Schema* schema, const #{rtype}& obj)
{
    return toAnything(dest, cursor, schema, std::make_tuple#{arguments});
}
|]
  where
    -- serialize the struct as a tuple of its fields, in declaration order
    arguments = tupled ["obj." <> key | (key, _) <- fields]

-- | Render a C++ deserializer (fromAnything + get_shm_size) for a struct.
printDeserializer ::
  Bool -> -- build object with constructor
  [MDoc] -> -- template parameters
  MDoc -> -- type of thing being deserialized
  [(MDoc, MDoc)] -> -- key and type for all fields
  MDoc
printDeserializer _ params rtype fields =
  [idoc|
#{printTemplateHeader params}
#{block 4 header body}

#{printTemplateHeader params}
#{block 4 headerGetSize bodyGetSize}
|]
  where
    header = [idoc|#{rtype} fromAnything(const Schema* schema, const void * anything, #{rtype}* dummy = nullptr, const void* base_ptr = nullptr)|]
    body =
      vsep $
        [[idoc|#{rtype} obj;|]]
          <> zipWith assignFields [0 ..] fields
          <> ["return obj;"]

    -- assign field idx from the corresponding schema parameter/offset
    assignFields :: Int -> (MDoc, MDoc) -> MDoc
    assignFields idx (keyName, keyType) =
      vsep
        [ [idoc|#{keyType}* elemental_dumby_#{keyName} = nullptr;|]
        , [idoc|obj.#{keyName} = fromAnything(schema->parameters[#{pretty idx}], (char*)anything + schema->offsets[#{pretty idx}], elemental_dumby_#{keyName}, base_ptr);|]
        ]

    headerGetSize = [idoc|size_t get_shm_size(const Schema* schema, const #{rtype}& data)|]
    bodyGetSize =
      vsep $
        ["size_t size = 0;"]
          <> [getSize idx key | (idx, (key, _)) <- zip [0 ..] fields]
          <> ["return size;"]

    getSize :: Int -> MDoc -> MDoc
    getSize idx key = [idoc|size += get_shm_size(schema->parameters[#{pretty idx}], data.#{key});|]



================================================
FILE: executable/CppTranslator.hs
================================================
{-# LANGUAGE FlexibleContexts #-}
{-# LANGUAGE FlexibleInstances #-}
{-# LANGUAGE OverloadedStrings #-}
{-# LANGUAGE QuasiQuotes #-}
{-# LANGUAGE TemplateHaskell #-}
{-# LANGUAGE UndecidableInstances #-}
{-# LANGUAGE ViewPatterns #-}

{- | Module      : CppTranslator
Description : Translate 'SerialManifold' trees into C++ pool source code
Copyright   : (c) Zebulun Arendsee, 2016-2026
License     : Apache-2.0
Maintainer  : z@morloc.io

Stateful C++ translator using the two-phase IR architecture: lower the
'SerialManifold' tree into 'IStmt'/'IExpr' via 'LowerConfig', then print via
'CppPrinter'. Handles C++-specific concerns like compilation flags, include
paths, struct generation, and template instantiation.
-}
module CppTranslator
  ( translate
  , cppLang
  ) where

import Control.Monad.Identity (Identity, runIdentity)
import qualified Control.Monad.State as CMS
import qualified CppPrinter as CP
import qualified Data.Char as DC
import qualified Data.Set as Set
import Data.Text (Text)
import qualified Data.Text as T
import Morloc.CodeGenerator.Grammars.Common
import Morloc.CodeGenerator.Grammars.Macro (expandMacro)
import Morloc.CodeGenerator.Grammars.Translator.Imperative
  ( IType (..)
  , LowerConfig (..)
  , buildProgramM
  , defaultFoldRules
  , expandDeserialize
  , expandSerialize
  , toIType
  )
import Morloc.CodeGenerator.Namespace
import Morloc.CodeGenerator.Serial
  ( serialAstToType
  , shallowType
  )
import Morloc.Data.Doc
import qualified Morloc.Data.GMap as GMap
import qualified Morloc.Data.Map as Map
import qualified Morloc.Data.Text as MT
import qualified Morloc.Language as ML
import qualified Morloc.Monad as MM
import qualified Morloc.Version as MV
import Morloc.Quasi
import qualified Morloc.System as MS
import qualified Morloc.TypeEval as TE

-- HACK: repeating these here is hacky
-- This same data is repeated in cpp/lang.yaml
cppLang :: ML.Lang
cppLang = ML.Lang "cpp" "cpp"

-- | The C++ type used for all serialized (packet) values.
serialType :: MDoc
serialType = "uint8_t*"

-- | How a C++ parameter is passed: by value, const reference, or const pointer.
data CallSemantics = Copy | Reference | ConstPtr

class HasCppType a where
  cppTypeOf :: a -> CppTranslator MDoc
  cppArgOf :: CallSemantics -> Arg a -> CppTranslator MDoc

-- | Qualify a rendered C++ type according to the chosen call semantics.
setCallSemantics :: CallSemantics -> MDoc -> MDoc
setCallSemantics Copy typestr = typestr
setCallSemantics Reference typestr = "const" <+> typestr <> "&"
setCallSemantics ConstPtr typestr = "const" <+> typestr

chooseCallSemantics :: TypeM -> CallSemantics
chooseCallSemantics Passthrough = ConstPtr -- const uint8_t* packet
chooseCallSemantics (Serial _) = ConstPtr -- const uint8_t* packet
chooseCallSemantics (Native _) = Reference -- for now, primitives should be pass by copy
chooseCallSemantics (Function _ _) = Copy -- currently not used

instance HasCppType TypeM where
  cppTypeOf (Serial _) = return serialType
  cppTypeOf (Native c) = cppTypeOf c
  cppTypeOf Passthrough = return serialType
  cppTypeOf (Function ts t) = do
    t' <- cppTypeOf t
    ts' <- mapM cppTypeOf ts
    return $ "std::function<" <> t' <> tupled ts' <> ">"
  cppArgOf s (Arg i t) = do
    typeStr <- cppTypeOf t
    let typeStrQualified = setCallSemantics s typeStr
    return $ case t of
      (Serial _) -> typeStrQualified <+> svarNamer i
      (Native _) -> typeStrQualified <+> nvarNamer i
      Passthrough -> typeStrQualified <+> svarNamer i
      (Function _ _) -> typeStrQualified <+> nvarNamer i

instance HasCppType NativeManifold where
  cppTypeOf = cppTypeOf . typeMof
  cppArgOf s r = cppArgOf s $ fmap typeMof r

instance {-# OVERLAPPABLE #-} (HasTypeF e) => HasCppType e where
  cppTypeOf = f . typeFof
    where
      f (UnkF (FV _ x)) = return $ pretty x
      f (VarF (FV _ x)) = return $ pretty x
      f (FunF ts t) = do
        t' <- f t
        ts' <- mapM f ts
        return $ "std::function<" <> t' <> tupled ts' <> ">"
      f (NatLitF _) = return mempty
      f (AppF t ts) = do
        t' <- f t
        -- natural-number literal parameters are compile-time only
        let runtimeTs = [x | x <- ts, not (isNatLitF x)]
        ts' <- mapM f runtimeTs
        return . pretty $ expandMacro (render t') (map render ts')
      f t@(NamF _ (FV gc (CV "struct")) _ rs) = do
        recmap <- CMS.gets translatorRecmap
        -- handle autogenerated structs
        case lookup (FV gc (CV "struct"), map fst rs) recmap of
          (Just rec) -> do
            params <- typeParams (zip (map snd (recFields rec)) (map snd rs))
            return $ recName rec <> params
          Nothing ->
            error $ "Record missing from recmap: " <> show t <> " from map: " <> show recmap
      f (NamF _ (FV _ (CV "arrow")) _ _) = return "mlc::ArrowTable"
      f (NamF _ (FV _ s) ps _) = do
        ps' <- mapM f ps
        return $ pretty s <> CP.printRecordTemplate ps'
      f (EffectF _ t) = do
        t' <- f t
        return $ "std::function<" <> t' <> "()" <> ">"
      f (OptionalF t) = do
        t' <- f t
        return $ "std::optional<" <> t' <> ">"
      isNatLitF (NatLitF _) = True
      isNatLitF _ = False
  cppArgOf s (Arg i t) = do
    t' <- cppTypeOf (typeFof t)
    return $ setCallSemantics s t' <+> nvarNamer i

-- | Mutable state threaded through the whole C++ translation pass.
data CppTranslatorState = CppTranslatorState
  { translatorCounter :: Int
  , translatorRecmap :: RecMap
  , translatorSignatureSet :: Set.Set Int
  , translatorLocalManifoldSet :: Set.Set Int
  , translatorRemoteManifoldSet :: Set.Set Int
  , translatorCurrentManifold :: Int
  , translatorEffectLabels :: Map.Map Int (Set.Set Text)
  }

instance Defaultable CppTranslatorState where
  defaultValue =
    CppTranslatorState
      { translatorCounter = 0
      , translatorRecmap = []
      , translatorSignatureSet = Set.empty
      , translatorLocalManifoldSet = Set.empty
      , translatorRemoteManifoldSet = Set.empty
      , translatorCurrentManifold = -1 -- -1 indicates we are not inside a manifold
      , translatorEffectLabels = Map.empty
      }

type CppTranslator a = CMS.StateT CppTranslatorState Identity a

type CppTranslatorM = CMS.StateT CppTranslatorState Identity

-- | Return the current counter value and post-increment it.
getCounter :: CppTranslator Int
getCounter = do
  s <- CMS.get
  let i = translatorCounter s
  CMS.put $ s {translatorCounter = translatorCounter s + 1}
  return i

-- | Reset the counter to zero (done at the start of each segment).
resetCounter :: CppTranslator ()
resetCounter = do
  s <- CMS.get
  CMS.put $ s {translatorCounter = 0}

-- | Translate sources and manifold segments into a complete C++ pool 'Script'.
translate :: [Source] -> [SerialManifold] -> MorlocMonad Script
translate srcs es = do
  -- scopeMap :: GMap Int MVar (Map.Map Lang Scope)
  scopeMap <- MM.gets stateConcreteTypedefs
  -- universalScopeMap :: GMap Int MVar Scope
  universalScopeMap <- MM.gets stateUniversalConcreteTypedefs
  effectMap <- MM.gets stateManifoldEffects
  -- Canonicalize C++ source paths once up front so that the #include
  -- directives emitted by makeCppCode and the -I flags emitted by
  -- makeTheMaker see exactly the same absolute paths. Before this,
  -- `#include "./src/foo.hpp"` could not be resolved against
  -- `-I/abs/src` because the `src/` prefix was duplicated.
  (srcs', _, _) <- handleFlagsAndPaths srcs
  let recmap = unifyRecords . concatMap collectRecords $ es
      translatorState =
        defaultValue {translatorRecmap = recmap, translatorEffectLabels = effectMap}
      code = CMS.evalState (makeCppCode srcs' es universalScopeMap scopeMap) translatorState
  maker <- makeTheMaker srcs'
  poolSubdir <- MM.getModuleName
  return $
    Script
      { scriptBase = "pool"
      , scriptLang = cppLang
      , scriptCode =
          "."
            :/ Dir
              "pools"
              [ Dir
                  poolSubdir
                  [ File
                      "pool.cpp"
                      (Code (T.replace "__MORLOC_VERSION__" (MT.pack MV.versionStr) (render code)))
                  ]
              ]
      , scriptMake = maker
      }

-- | Assemble the full pool source: serializers, signatures, includes, and
-- the translated manifold bodies.
makeCppCode ::
  [Source] ->
  [SerialManifold] ->
  Map.Map Lang Scope ->
  GMap Int MVar (Map.Map Lang Scope) ->
  CppTranslator MDoc
makeCppCode srcs es univeralScopeMap scopeMap = do
  -- ([MDoc], [MDoc])
  (srcDecl, srcSerial) <- generateSourcedSerializers univeralScopeMap scopeMap es
  -- write include statements for sources
  let includeDocs = map translateSource (unique . mapMaybe srcPath $ srcs)
  signatures <- concat <$> mapM makeSignature es
  (autoDecl, autoSerial) <- generateAnonymousStructs
  let serializationCode = autoDecl ++ srcDecl ++ autoSerial ++ srcSerial
  -- build the program (translates each manifold tree)
  program <- buildProgramM includeDocs es translateSegment
  -- create and return complete pool script
  return $ CP.printProgram serializationCode signatures program

-- | Look up the C++ scope for a manifold index, dropping empty entries.
metaTypedefs ::
  GMap Int MVar (Map.Map Lang Scope) ->
  Int -> -- manifold index
  Scope
metaTypedefs tmap i = case GMap.lookup i tmap of
  (GMapJust langmap) -> case Map.lookup cppLang langmap of
    (Just scope) -> Map.filter (not . null) scope
    Nothing -> Map.empty
  _ -> Map.empty

-- | Collect TVar names of all named (non-anonymous) record types used
-- in a SerialManifold tree.
collectNamedRecordTVars :: SerialManifold -> Set.Set TVar
collectNamedRecordTVars e0 = runIdentity $ foldWithSerialManifoldM fm e0
  where
    fm =
      defaultValue
        { opFoldWithNativeExprM = nativeExpr
        , opFoldWithSerialExprM = serialExpr
        }
    nativeExpr _ (DeserializeN_ t s xs) =
      return $ Set.unions [xs, seekNamedRecs t, seekNamedRecs (serialAstToType s)]
    nativeExpr efull e =
      return $ foldlNE Set.union (seekNamedRecs (typeFof efull)) e
    serialExpr _ (SerializeS_ s xs) =
      return $ Set.union (seekNamedRecs (serialAstToType s)) xs
    serialExpr _ e = return $ foldlSE Set.union Set.empty e

    -- recurse through a type, collecting only non-"struct" record names
    seekNamedRecs :: TypeF -> Set.Set TVar
    seekNamedRecs (NamF _ (FV v (CV c)) _ rs)
      | c /= "struct" = Set.insert v (Set.unions (map (seekNamedRecs . snd) rs))
    seekNamedRecs (NamF _ _ _ rs) = Set.unions (map (seekNamedRecs . snd) rs)
    seekNamedRecs (FunF ts t) = Set.unions (map seekNamedRecs (t : ts))
    seekNamedRecs (AppF t ts) = Set.unions (map seekNamedRecs (t : ts))
    seekNamedRecs (EffectF _ t) = seekNamedRecs t
    seekNamedRecs (OptionalF t) = seekNamedRecs t
    seekNamedRecs _ = Set.empty

-- | Build the g++ command that compiles the generated pool source.
makeTheMaker :: [Source] -> MorlocMonad [SysCommand]
makeTheMaker srcs = do
  poolSubdir <- MM.getModuleName
  -- NOTE(review): the path-combine operator on the next two lines was lost in
  -- extraction (stripped as an HTML-like tag); reconstructed as (</>) —
  -- confirm against upstream.
  let outfile = pretty $ "pools" </> poolSubdir </> ML.makeExecutablePoolName cppLang
  let src = pretty $ "pools" </> poolSubdir </> ML.makeSourcePoolName cppLang
  (_, flags, includes) <- handleFlagsAndPaths srcs
  bconf <- MM.gets stateBuildConfig
  let sanitizeFlags = case buildConfigSanitize bconf of
        Just True -> ["-fsanitize=alignment", "-fno-sanitize-recover=alignment"]
        _ -> []
  let incs = "-I." : [pretty ("-I" <> i) | i <- includes]
  let flags' = map pretty (flags ++ sanitizeFlags)
  let cmd =
        SysRun . Code . render $
          [idoc|g++ -O2 -o #{outfile} #{src} #{hsep flags'} #{hsep incs}|]
  return [cmd]

-- | Emit forward-declaration signatures for every manifold in a tree.
makeSignature :: SerialManifold -> CppTranslator [MDoc]
makeSignature = foldWithSerialManifoldM fm
  where
    fm =
      defaultValue
        { opFoldWithSerialManifoldM = serialManifold
        , opFoldWithNativeManifoldM = nativeManifold
        }
    serialManifold (SerialManifold m _ form _ _) _ = manifoldSignature m serialType form
    nativeManifold e@(NativeManifold m _ form _) _ = do
      typestr <- cppTypeOf e
      manifoldSignature m typestr form

-- | Emit one signature per manifold id; deduplicated via the signature set.
manifoldSignature ::
  (HasTypeM t) =>
  Int ->
  MDoc ->
  ManifoldForm (Or TypeS TypeF) t ->
  CppTranslator [MDoc]
manifoldSignature i typestr form = do
  s <- CMS.get
  if Set.member i (translatorSignatureSet s)
    then return []
    else do
      let formArgs = typeMofForm form
      args <- mapM (\r@(Arg _ t) -> cppArgOf (chooseCallSemantics t) r) formArgs
      CMS.put (s {translatorSignatureSet = Set.insert i (translatorSignatureSet s)})
      return [typestr <+> manNamer i <> tupled args <> ";"]

tupleKey :: Int -> MDoc -> MDoc
tupleKey i v = [idoc|std::get<#{pretty i}>(#{v})|]

recordAccess :: MDoc -> MDoc -> MDoc
recordAccess record field = record <> "." <> field

-- | C++ lowering configuration: every language-specific hook used by the
-- generic IR lowering machinery.
cppLowerConfig :: LowerConfig CppTranslatorM
cppLowerConfig =
  LowerConfig
    { lcSrcName = \src -> pretty (srcName src)
    , lcTypeOf = \t -> Just . toIType <$> cppTypeOf t
    , lcSerialAstType = serializeTypeOf
    , lcDeserialAstType = \s -> Just . toIType <$> cppTypeOf (shallowType s)
    , lcRawDeserialAstType = rawTypeOf
    , lcTypeMOf = \_ -> return Nothing
    , lcPackerName = \src -> pretty (srcName src)
    , lcUnpackerName = \src -> pretty (srcName src)
    , lcRecordAccessor = \_ _ -> recordAccess
    , lcDeserialRecordAccessor = \i _ v -> tupleKey i v
    , lcTupleAccessor = tupleKey
    , lcNewIndex = getCounter
    , lcPrintExpr = CP.printExpr
    , lcPrintStmt = CP.printStmt
    , lcEvalPattern = \t p xs -> do
        state <- CMS.get
        return $ evaluatePattern state t p xs
    , lcListConstructor = \_ _ es -> encloseSep "{" "}" "," es
    , lcTupleConstructor = \_ -> ((<>) "std::make_tuple" . tupled)
    , lcRecordConstructor = \recType _ _ _ rs -> do
        t <- cppTypeOf recType
        idx <- getCounter
        let v' = "a" <> pretty idx
            decl = t <+> v' <+> "=" <+> encloseSep "{" "}" "," (map snd rs) <> ";"
        return $ defaultValue {poolExpr = v', poolPriorLines = [decl]}
    , lcForeignCall = \socketFile mid args ->
        let argList = [dquotes socketFile, pretty mid] <> args <> ["NULL"]
         in [idoc|foreign_call#{tupled argList}|]
    , lcRemoteCall = \socketFile mid res args -> do
        let resMem = pretty $ fromMaybe (-1) (remoteResourcesMemory res)
            resTime = pretty $ maybe (-1) unTimeInSeconds (remoteResourcesTime res)
            resCPU = pretty $ fromMaybe (-1) (remoteResourcesThreads res)
            resGPU = pretty $ fromMaybe 0 (remoteResourcesGpus res)
            cacheDir = ".morloc-cache"
            argList = encloseSep "{" "}" "," args
            setup =
              [idoc|resources_t resources = {#{resMem}, #{resTime}, #{resCPU}, #{resGPU}};
const uint8_t* args[] = #{argList};
char* errmsg = NULL;|]
            call =
              [idoc|remote_call(
    #{pretty mid},
    #{dquotes socketFile},
    #{dquotes cacheDir},
    &resources,
    args,
    #{pretty (length args)},
    &errmsg
);
PROPAGATE_ERROR(errmsg)|]
        return $ defaultValue {poolExpr = call, poolPriorLines = [setup]}
    , lcMakeLet = \namer letIndex mt e1 e2 -> do
        typestr <- case mt of
          (Just t) -> cppTypeOf t
          Nothing -> return serialType
        return $ makeLet namer letIndex typestr e1 e2
    , lcReturn = \e -> "return(" <> e <> ");"
    , lcMakeIf = \origExpr condDocs thenDocs elseDocs -> do
        idx <- getCounter
        let v = helperNamer idx
        typeStr <- cppTypeOf origExpr
        let condE = poolExpr condDocs
            thenE = poolExpr thenDocs
            elseE = poolExpr elseDocs
            thenBlock = poolPriorLines thenDocs <> [v <+> "=" <+> thenE <> ";"]
            elseBlock = poolPriorLines elseDocs <> [v <+> "=" <+> elseE <> ";"]
            decl = typeStr <+> v <> ";"
            ifStmt =
              vsep
                [ decl
                , "if" <+> parens condE <+> "{"
                , indent 4 (vsep thenBlock)
                , "} else {"
                , indent 4 (vsep elseBlock)
                , "}"
                ]
        return $
          PoolDocs
            { poolCompleteManifolds =
                poolCompleteManifolds condDocs
                  <> poolCompleteManifolds thenDocs
                  <> poolCompleteManifolds elseDocs
            , poolExpr = v
            , poolPriorLines = poolPriorLines condDocs <> [ifStmt]
            , poolPriorExprs =
                poolPriorExprs condDocs
                  <> poolPriorExprs thenDocs
                  <> poolPriorExprs elseDocs
            }
    , lcMakeDoBlock = \t stmts expr ->
        let isUnit = case t of
              EffectF _ (VarF (FV tv _)) -> tv == TV "Unit"
              VarF (FV tv _) -> tv == TV "Unit"
              _ -> False
         in (,) [] $ case (isUnit, stmts) of
              (True, []) -> "[&](){" <> expr <> "; return mlc::Unit{};}"
              (True, _) ->
                "[&](){"
                  <> nest 4 (line <> vsep (stmts <> [expr <> ";", "return mlc::Unit{};"]))
                  <> line
                  <> "}"
              (False, []) -> "[&](){return " <> expr <> ";}"
              (False, _) ->
                "[&](){"
                  <> nest 4 (line <> vsep (stmts <> ["return " <> expr <> ";"]))
                  <> line
                  <> "}"
    , lcSerialize = \v s -> serialize v s
    , lcDeserialize = \t v s -> do
        typestr <- cppTypeOf t
        deserialize v typestr s
    , lcMakeFunction = \mname args manifoldType priorLines body headForm -> do
        callIndex <- CMS.gets translatorCurrentManifold
        state <- CMS.get
        let effectLabels =
              Map.findWithDefault Set.empty callIndex (translatorEffectLabels state)
        let alreadyDone = case headForm of
              (Just HeadManifoldFormRemoteWorker) ->
                Set.member callIndex (translatorRemoteManifoldSet state)
              _ -> Set.member callIndex (translatorLocalManifoldSet state)
        if alreadyDone
          then return Nothing
          else do
            case headForm of
              (Just HeadManifoldFormRemoteWorker) ->
                CMS.modify
                  ( \s ->
                      s
                        { translatorRemoteManifoldSet =
                            Set.insert callIndex (translatorRemoteManifoldSet s)
                        }
                  )
              _ ->
                CMS.modify
                  ( \s ->
                      s
                        { translatorLocalManifoldSet =
                            Set.insert callIndex (translatorLocalManifoldSet s)
                        }
                  )
            returnTypeStr <- returnType manifoldType
            typedArgs <- mapM (\r@(Arg _ t) -> cppArgOf (chooseCallSemantics t) r) args
            let fullName = mname <> mnameExt headForm
                decl = returnTypeStr <+> fullName <> tupled typedArgs
                enrichError = case headForm of
                  Just HeadManifoldFormRemoteWorker -> True
                  _ -> Set.member "Error" effectLabels
                tryBody = block 4 "try" (vsep $ priorLines <> [body])
                catchBody
                  | enrichError =
                      let throwStatement =
                            vsep
                              [ [idoc|std::string error_message = "Error raised in C++ pool by #{mname}:\n" + std::string(e.what());|]
                              , [idoc|throw std::runtime_error(error_message);|]
                              ]
                       in block 4 "catch (const std::exception& e)" throwStatement
                  | otherwise = block 4 "catch (...)" "throw;"
            return . Just . block 4 decl . vsep $ [tryBody <+> catchBody]
    , lcMakeLambda = \mname contextArgs boundArgs ->
        let vs' =
              take
                (length boundArgs)
                (map (\j -> "std::placeholders::_" <> viaShow j) ([1 ..] :: [Int]))
         in [idoc|std::bind(#{cat (punctuate "," (mname : (contextArgs ++ vs')))})|]
    }
  where
    -- For serialization, records become tuples (that's what _put_value/toAnything expects)
    serializeTypeOf :: SerialAST -> CppTranslator (Maybe IType)
    serializeTypeOf (SerialObject _ _ _ rs) = Just . toIType <$> recordToCppTuple (map snd rs)
    serializeTypeOf s = Just . toIType <$> cppTypeOf (serialAstToType s)

    rawTypeOf :: SerialAST -> CppTranslator (Maybe IType)
    rawTypeOf (SerialObject _ _ _ rs) = Just . toIType <$> recordToCppTuple (map snd rs)
    rawTypeOf s = Just . toIType <$> cppTypeOf (serialAstToType s)

-- | Splice a typed let-assignment between the prior lines of two PoolDocs.
makeLet :: (Int -> MDoc) -> Int -> MDoc -> PoolDocs -> PoolDocs -> PoolDocs
makeLet namer letIndex typestr (PoolDocs ms1 e1 rs1 pes1) (PoolDocs ms2 e2 rs2 pes2) =
  let letAssignment = [idoc|#{typestr} #{namer letIndex} = #{e1};|]
      rs = rs1 <> [letAssignment] <> rs2
   in PoolDocs
        { poolCompleteManifolds = ms1 <> ms2
        , poolExpr = e2
        , poolPriorLines = rs
        , poolPriorExprs = pes1 <> pes2
        }

mnameExt :: Maybe HeadManifoldForm -> MDoc
mnameExt (Just HeadManifoldFormRemoteWorker) = "_remote"
mnameExt _ = ""

returnType :: TypeM -> CppTranslator MDoc
returnType (Function _ t) = cppTypeOf t
returnType t = cppTypeOf t

-- Use `#include "foo.h"` rather than `#include <foo.h>`
translateSource ::
  -- | Path to a header (e.g., `$MORLOC_HOME/src/foo.h`)
  Path ->
  MDoc
translateSource path = "#include" <+> (dquotes . pretty) path

serialize :: MDoc -> SerialAST -> CppTranslator PoolDocs
serialize v s = do
  (expr, stmts) <- expandSerialize cppLowerConfig v s
  return $
    PoolDocs
      { poolCompleteManifolds = []
      , poolExpr = CP.printExpr expr
      , poolPriorLines = map CP.printStmt stmts
      , poolPriorExprs = []
      }

-- reverse of serialize, parameters are the same
deserialize :: MDoc -> MDoc -> SerialAST -> CppTranslator (MDoc, [MDoc])
deserialize varname0 typestr0 s0 = do
  (expr, stmts) <- expandDeserialize cppLowerConfig varname0 s0
  let rendered = CP.printExpr expr
  if null stmts
    then return (rendered, [])
    else do
      schemaVar <- helperNamer <$> getCounter
      let final = [idoc|#{typestr0} #{schemaVar} = #{rendered};|]
      return (schemaVar, map CP.printStmt stmts ++ [final])

recordToCppTuple :: [SerialAST] -> CppTranslator MDoc
recordToCppTuple ts = do
  tsDocs <- mapM (cppTypeOf . serialAstToType) ts
  return $ "std::tuple" <> encloseSep "<" ">" "," tsDocs

-- | Translate one manifold segment, resetting the per-segment counter first.
translateSegment :: SerialManifold -> CppTranslator MDoc
translateSegment m0 = do
  resetCounter
  e <- surroundFoldSerialManifoldM manifoldIndexer (defaultFoldRules cppLowerConfig) m0
  return $ renderPoolDocs e
  where
    manifoldIndexer =
      makeManifoldIndexer
        (CMS.gets translatorCurrentManifold)
        (\i -> CMS.modify (\s -> s {translatorCurrentManifold = i}))

-- handle string interpolation
evaluatePattern :: CppTranslatorState -> TypeF -> Pattern -> [MDoc] -> MDoc
evaluatePattern _ _ (PatternText s ss) xs =
  "interweave_strings" <> tupled [fragments, insertions]
  where
    fragments =
      encloseSep "{" "}" ", " (map (dquotes . pretty . escapeQuotes "\"" "\\\"" . escapeStringLit) (s : ss))
    insertions = encloseSep "{" "}" ", " xs
-- handle getters
evaluatePattern _ _ (PatternStruct (ungroup -> [ss])) [m] = writeSelector m ss
evaluatePattern _ _ (PatternStruct (ungroup -> sss)) [m] =
  encloseSep "{" "}" "," (map (writeSelector m) sss)
evaluatePattern state0 t0 (PatternStruct s0) (m0 : xs0) =
  patternSetter makeTuple makeRecord accessTuple accessRecord m0 t0 s0 xs0
  where
    makeTuple (AppF _ ts) xs =
      let tupleTypes = CMS.evalState (mapM cppTypeOf ts) state0
       in "std::tuple" <> encloseSep "<" ">" "," tupleTypes <> tupled xs
    makeTuple _ _ = error "Unreachable"
    makeRecord _ xs = encloseSep "{" "}" ", " xs
    accessTuple _ m i = "std::get<" <> pretty i <> ">(" <> m <> ")"
    accessRecord _ d k = d <> "." <> pretty k
evaluatePattern _ _ (PatternStruct _) [] = error "Unreachable illegal pattern"

-- | Render a chain of tuple/record selectors applied to a base document.
writeSelector :: MDoc -> [Either Int Text] -> MDoc
writeSelector d [] = d
writeSelector d (Right k : rs) = writeSelector (d <> "." <> pretty k) rs
writeSelector d (Left i : rs) =
  writeSelector ("std::get<" <> pretty i <> ">" <> parens d) rs

typeParams :: [(Maybe TypeF, TypeF)] -> CppTranslator MDoc
typeParams ts = CP.printRecordTemplate <$> mapM cppTypeOf [t | (Nothing, t) <- ts]

-- | Generate struct declarations and (de)serializers for every autogenerated
-- (anonymous) record in the recmap.
generateAnonymousStructs :: CppTranslator ([MDoc], [MDoc])
generateAnonymousStructs = do
  recmap <- CMS.gets translatorRecmap
  xs <- mapM makeSerializers (reverse . map snd $ recmap)
  return (concatMap fst xs, concatMap snd xs)
  where
    makeSerializers :: RecEntry -> CppTranslator ([MDoc], [MDoc])
    makeSerializers rec = do
      let templateTerms = map (("T" <>) . pretty) ([1 ..] :: [Int])
          rs' = zip templateTerms (recFields rec)
      let params = [t | (t, (_, Nothing)) <- rs']
          rname = recName rec
          rtype = rname <> CP.printRecordTemplate [v | (v, (_, Nothing)) <- rs']
      let fieldNames = [k | (_, (k, _)) <- rs']
      fieldTypes <-
        mapM (\(t, v) -> maybeM t cppTypeOf v) [(t', v') | (t', (_, v')) <- rs']
      let fields = [(pretty k, v) | (k, v) <- zip fieldNames fieldTypes]
      let structDecl = CP.printStructTypedef params rname fields
          serializer = CP.printSerializer params rtype fields
          deserializer = CP.printDeserializer False params rtype fields
      return ([structDecl], [serializer, deserializer])

-- monadic form of `maybe` function
maybeM :: (Monad m) => a -> (b -> m a) -> Maybe b -> m a
maybeM _ f (Just x) = f x
maybeM x _ Nothing = return x

generateSourcedSerializers ::
  Map.Map Lang Scope ->
  GMap Int MVar (Map.Map Lang Scope) ->
  [SerialManifold] -> -- all segments that can be called in this pool
  CppTranslator
    ( [MDoc]
    , [MDoc]
    )
generateSourcedSerializers univeralScopeMap scopeMap es0 = do
  perManifold <- Map.unions <$> mapM (foldSerialManifoldM fm) es0
  scope <- case Map.lookup cppLang univeralScopeMap of
    (Just scope) -> return scope
    Nothing -> return Map.empty
  -- Supplement per-manifold typedefs with universal scope entries for named
  -- record types that appear in this pool but are missing from the per-manifold
  -- scope (happens in secondary C++ pools called via foreign_call).
  let usedTypes = Set.unions (map collectNamedRecordTVars es0)
      missingTypes = Set.difference usedTypes (Map.keysSet perManifold)
      supplemental = Map.filterWithKey (\k _ -> Set.member k missingTypes) scope
      typedef = Map.unionWith mergeScopes perManifold supplemental
  foldl groupQuad ([], []) . concat .
Map.elems <$> Map.mapWithKeyM (makeSerials scope) typedef where -- given the universal map of scopes, pull out every one that is used in this subtree fm = defaultValue { opSerialManifoldM = \(SerialManifold_ i _ _ _ e) -> return $ Map.unionWith mergeScopes (metaTypedefs scopeMap i) e , opNativeManifoldM = \(NativeManifold_ i _ _ e) -> return $ Map.unionWith mergeScopes (metaTypedefs scopeMap i) e } -- there are likely to be repeats in the scopes, we only want the unique ones mergeScopes xs ys = unique (xs <> ys) groupQuad :: ([a], [a]) -> (a, a) -> ([a], [a]) groupQuad (xs, ys) (x, y) = (x : xs, y : ys) makeSerials :: Scope -> TVar -> [([Either (TVar, Kind) TypeU], TypeU, ArgDoc, Bool)] -> CppTranslator [(MDoc, MDoc)] makeSerials s v xs = catMaybes <$> mapM (makeSerial s v) xs makeSerial :: Scope -> TVar -> ([Either (TVar, Kind) TypeU], TypeU, ArgDoc, Bool) -> CppTranslator (Maybe (MDoc, MDoc)) makeSerial _ _ (_, NamU _ (TV "struct") _ _, _, _) = return Nothing makeSerial _ _ (_, NamU _ (TV "arrow") _ _, _, _) = return Nothing makeSerial scope _ (ps, NamU r (TV v) _ rs, _, _) = do params <- mapM (either (\(p, _) -> return $ "T" <> pretty p) (\_ -> return "XXX_FIXME")) ps let templateTerms = ["T" <> pretty p | Left (p, _) <- ps] rtype = pretty v <> CP.printRecordTemplate templateTerms rs' = map (second (evaluateTypeU scope)) rs fields = [(pretty k, showDefType ps (typeOf t)) | (k, t) <- rs'] serializer = CP.printSerializer params rtype fields deserializer = CP.printDeserializer (r == NamObject) params rtype fields return $ Just (serializer, deserializer) makeSerial _ _ _ = return Nothing evaluateTypeU :: Scope -> TypeU -> TypeU evaluateTypeU scope t = case TE.evaluateType scope t of (Left e) -> error $ show e (Right t') -> t' showDefType :: [Either (TVar, Kind) TypeU] -> Type -> MDoc showDefType ps (UnkT v) | any (\p -> either (\(tv, _) -> tv == v) (const False) p) ps = "T" <> pretty v | otherwise = pretty v showDefType ps (VarT v) | any (\p -> either (\(tv, _) -> 
tv == v) (const False) p) ps = "T" <> pretty v | otherwise = pretty v showDefType _ (FunT _ _) = error "Cannot serialize functions" showDefType _ (NamT _ v _ _) = pretty v showDefType _ (NatLitT _) = mempty showDefType ps (AppT (VarT (TV v)) ts) = pretty $ expandMacro v (map (render . showDefType ps) runtimeTs) where runtimeTs = [t | t <- ts, not (isNatLitT t)] showDefType _ (AppT _ _) = error "AppT is only OK with VarT, for now" showDefType _ (EffectT _ _) = error "Cannot show EffectT" showDefType _ (NatAddT _ _) = mempty showDefType _ (NatMulT _ _) = mempty showDefType _ (NatSubT _ _) = mempty showDefType _ (NatDivT _ _) = mempty showDefType ps (OptionalT t) = "std::optional<" <> showDefType ps t <> ">" isNatLitT (NatLitT _) = True isNatLitT _ = False -- C++ specific source handling (flags, headers, libraries) handleFlagsAndPaths :: [Source] -> MorlocMonad ([Source], [Text], [Path]) handleFlagsAndPaths srcs = do state <- MM.get let gccversion = gccVersionFlag . foldl max 0 . map packageCppVersion $ statePackageMeta state let explicitLibs = map ("-l" <>) . unique . concatMap packageDependencies $ statePackageMeta state (srcs', libflags, paths) <- fmap unzip3 . mapM flagAndPath . unique $ [s | s <- srcs, srcLang s == cppLang] home <- MM.asks configHome let mlcInclude = ["-I" <> home <> "/include"] mlcPch = ["-include", "morloc_pch.hpp"] mlcLib = ["-L" <> home <> "/lib", "-Wl,-rpath," <> home <> "/lib", "-lmorloc", "-lcppmorloc", "-lpthread"] return ( filter (isJust . srcPath) srcs' , [gccversion] <> explicitLibs ++ (map MT.pack . 
concat) (mlcPch : mlcInclude : mlcLib : libflags) , unique (catMaybes paths) ) gccVersionFlag :: Int -> Text gccVersionFlag i | i <= 17 = "-std=c++17" | otherwise = "-std=c++" <> MT.show' i flagAndPath :: Source -> MorlocMonad (Source, [String], Maybe Path) flagAndPath src@(Source _ srcL (Just p) _ _ _ _ _ _) | srcL == cppLang = case (MS.takeDirectory p, MS.dropExtensions (MS.takeFileName p), MS.takeExtensions p) of (".", base, "") -> do header <- lookupHeader base libFlags <- lookupLib base return (src {srcPath = Just header}, libFlags, Just (MS.takeDirectory header)) (dir, base, _) -> do libFlags <- lookupLib base absDir <- liftIO $ MS.canonicalizePath dir absPath <- liftIO $ MS.canonicalizePath p return (src {srcPath = Just absPath}, libFlags, Just absDir) where lookupHeader :: String -> MorlocMonad Path lookupHeader base = do home <- MM.asks configHome let allPaths = getHeaderPaths home base [".h", ".hpp", ".hxx"] existingPaths <- liftIO . fmap catMaybes . mapM getFile $ allPaths case existingPaths of (x : _) -> liftIO $ MS.canonicalizePath x [] -> MM.throwSystemError $ "Header file " <> pretty base <> ".* not found" lookupLib :: String -> MorlocMonad [String] lookupLib base = do home <- MM.asks configHome let libnamebase = filter DC.isAlphaNum (map DC.toLower base) let libname = "lib" <> libnamebase <> ".so" let allPaths = getLibraryPaths home base libname existingPaths <- liftIO . fmap catMaybes . mapM getFile $ allPaths case existingPaths of (libpath : _) -> do libdir <- liftIO . MS.canonicalizePath . 
MS.takeDirectory $ libpath return [ "-Wl,-rpath=" <> libdir , "-L" <> libdir , "-l" <> libnamebase ] [] -> return [] flagAndPath src@(Source _ srcL Nothing _ _ _ _ _ _) | srcL == cppLang = return (src, [], Nothing) flagAndPath _ = MM.throwSystemError $ "flagAndPath should only be called for C++ functions" getFile :: Path -> IO (Maybe Path) getFile x = do exists <- MS.doesFileExist x return $ if exists then Just x else Nothing getHeaderPaths :: Path -> String -> [String] -> [Path] getHeaderPaths lib base exts = [path <> ext | path <- paths, ext <- exts] where paths = map MS.joinPath [ [base] , ["include", base] , [base, base] , [lib, "include", base] , [lib, "src", base, base] , ["/usr/include", base] , ["/usr/local/include", base] ] getLibraryPaths :: Path -> String -> String -> [Path] getLibraryPaths lib base sofile = map MS.joinPath [ [sofile] , ["lib", sofile] , [base, sofile] , [lib, "lib", sofile] , [lib, "src", base, sofile] , [lib, "src", base, "lib", sofile] ] ================================================ FILE: executable/Main.hs ================================================ {- | Module : Main Description : Executable main module Copyright : (c) Zebulun Arendsee, 2016-2026 License : Apache-2.0 Maintainer : z@morloc.io -} module Main where import GHC.IO.Encoding (setLocaleEncoding, utf8) import Options.Applicative import Subcommands (runMorloc) import UI main :: IO () main = do setLocaleEncoding utf8 runMorloc =<< execParser opts ================================================ FILE: executable/Subcommands.hs ================================================ {-# LANGUAGE OverloadedStrings #-} {- | Module : Subcommands Description : Dispatch CLI subcommands and inject the translator callback Copyright : (c) Zebulun Arendsee, 2016-2026 License : Apache-2.0 Maintainer : z@morloc.io Implements each CLI subcommand (make, typecheck, install, init, dump) and defines the 'TranslateFn' callback that routes C++ to 'CppTranslator' and other languages to the 
generic translator. This is the dependency injection point that keeps translator code out of the library. -} module Subcommands (runMorloc) where import Control.Exception (SomeException, bracket, finally, try) import Data.Time.Clock (getCurrentTime) import Data.Time.Format (formatTime, defaultTimeLocale) import qualified CppTranslator import qualified Data.Aeson as JSON import qualified Data.ByteString.Lazy as BL import qualified Data.Map as Map import qualified Data.Set as Set import qualified Data.Text as T import qualified Data.Text.IO as TIO import Morloc (generatePools) import qualified Morloc as M import Morloc.CodeGenerator.Emit (TranslateFn) import qualified Morloc.CodeGenerator.Grammars.Translator.Generic as Generic import Morloc.CodeGenerator.Grammars.Translator.PseudoCode (pseudocodeSerialManifold) import Morloc.CodeGenerator.Namespace (SerialManifold (..)) import qualified Morloc.CodeGenerator.SystemConfig as MSC import qualified Morloc.Completion as Completion import qualified Morloc.Config as Config import Morloc.Data.Doc import qualified Morloc.Data.GMap as GMap import qualified Morloc.Data.Text as MT import qualified Morloc.Frontend.API as F import Morloc.Module (OverwriteProtocol (..), findMainLocFile) import qualified Morloc.Module as Mod import qualified Morloc.Monad as MM import Morloc.Namespace.Expr import Morloc.Namespace.Prim import Morloc.Namespace.State import Morloc.Namespace.Type import qualified Morloc.ProgramBuilder.Install as Install import Morloc.Typecheck.Internal (prettyTypeU) import System.Directory ( createDirectoryIfMissing , doesDirectoryExist , doesFileExist , getCurrentDirectory , listDirectory , removeDirectoryRecursive , removeFile , setCurrentDirectory ) import System.Exit (exitFailure, exitSuccess) import System.FilePath (dropExtension, takeDirectory, takeFileName) import System.IO (hPutStrLn, stderr) import System.IO.Temp (createTempDirectory) import qualified System.Process as SP import UI decodePackageMeta :: 
BL.ByteString -> Maybe PackageMeta decodePackageMeta = JSON.decode -- | Route each language to its translator. translator :: TranslateFn translator lang srcs es | lang == CppTranslator.cppLang = CppTranslator.translate srcs es | otherwise = Generic.translate lang srcs es runMorloc :: CliCommand -> IO () runMorloc args = do config <- getConfig args buildConfig <- Config.loadBuildConfig config let verbose = getVerbosity args runPassed <- case args of (CmdMake g) -> cmdMake g verbose config buildConfig (CmdInstall g) -> cmdInstall g verbose config buildConfig (CmdTypecheck g) -> cmdTypecheck g verbose config buildConfig (CmdDump g) -> cmdDump g verbose config buildConfig (CmdInit g) -> cmdInit g config (CmdList g) -> cmdList g config (CmdUninstall g) -> cmdUninstall g config (CmdNew g) -> cmdNew g (CmdEval g) -> cmdEval g verbose config buildConfig case runPassed of True -> exitSuccess False -> exitFailure -- | read the global morloc config file or return a default one getConfig :: CliCommand -> IO Config.Config getConfig (CmdMake g) = getConfig' (makeConfig g) (makeVanilla g) getConfig (CmdInstall g) = getConfig' (installConfig g) (installVanilla g) getConfig (CmdTypecheck g) = getConfig' (typecheckConfig g) (typecheckVanilla g) getConfig (CmdDump g) = getConfig' (dumpConfig g) (dumpVanilla g) getConfig (CmdInit g) = getConfig' (initConfig g) (initVanilla g) getConfig (CmdList g) = getConfig' (listConfig g) (listVanilla g) getConfig (CmdUninstall g) = getConfig' (uninstallConfig g) (uninstallVanilla g) getConfig (CmdEval g) = getConfig' (evalConfig g) (evalVanilla g) getConfig (CmdNew _) = getConfig' "" False getConfig' :: String -> Bool -> IO Config.Config getConfig' _ True = Config.loadMorlocConfig Nothing getConfig' "" _ = Config.loadMorlocConfig Nothing getConfig' filename _ = Config.loadMorlocConfig (Just filename) getVerbosity :: CliCommand -> Int getVerbosity (CmdMake g) = makeVerbose g getVerbosity (CmdInstall g) = installVerbose g getVerbosity (CmdTypecheck 
g) = typecheckVerbose g getVerbosity (CmdDump g) = dumpVerbose g getVerbosity (CmdInit g) = if initQuiet g then 0 else 1 getVerbosity (CmdList g) = listVerbose g getVerbosity (CmdEval g) = evalVerbose g getVerbosity (CmdUninstall _) = 0 getVerbosity (CmdNew _) = 0 readScript :: Bool -> String -> IO (Maybe Path, Code) readScript True code = return (Nothing, Code (MT.pack code)) readScript _ filename = do code <- MT.readFile filename return (Just filename, Code code) -- | Typecheck callback for module installation typecheckModuleFn :: FilePath -> MorlocMonad [(T.Text, T.Text)] typecheckModuleFn mainFile = do code <- liftIO $ MT.readFile mainFile -- Save current state, run typecheck in a clean sub-state savedState <- MM.get result <- MM.catchError ( do xs <- M.typecheckFrontend (Just mainFile) (Code code) st <- MM.get return [ (render (pretty v), render (pretty t)) | AnnoS (Idx i t) _ _ <- xs , Just v <- [Map.lookup i (stateName st)] ] ) (\_ -> return []) -- Restore state so module typechecking doesn't pollute the parent state MM.put savedState return result -- | Install a module cmdInstall :: InstallCommand -> Int -> Config.Config -> BuildConfig -> IO Bool cmdInstall args verbosity conf buildConfig = do userSources <- Map.fromList <$> mapM (\modstr -> do name <- Mod.extractModuleName modstr return (name, modstr)) moduleTexts let cmdInstall' = mapM ( \modstr -> Mod.installModule (installForce args) (installUseSSH args) libpath (Config.configPlaneCore conf) mayTypecheck userSources Set.empty Mod.ExplicitInstall modstr ) moduleTexts passed <- MM.runMorlocMonad Nothing verbosity conf buildConfig cmdInstall' >>= MM.writeMorlocReturn if passed && installBuild args then buildInstalledModules args verbosity conf buildConfig moduleTexts libpath else return passed where libpath = Config.configLibrary conf Config.configPlane conf moduleTexts = map MT.pack (installModuleStrings args) mayTypecheck = if installNoTypecheck args then Nothing else Just typecheckModuleFn -- | Build 
and install executables for installed modules buildInstalledModules :: InstallCommand -> Int -> Config.Config -> BuildConfig -> [T.Text] -> FilePath -> IO Bool buildInstalledModules args verbosity conf buildConfig moduleTexts libpath = do results <- mapM buildOne moduleTexts return (and results) where force = installForce args == ForceOverwrite buildOne modstr = do name <- T.unpack <$> Mod.extractModuleName modstr let moduleDir = libpath name mainFile <- findMainLocFile moduleDir name case mainFile of Nothing -> do putStrLn $ "Warning: no main.loc found for '" <> name <> "', skipping build" return True Just locFile -> do origDir <- getCurrentDirectory setCurrentDirectory moduleDir buildResult <- buildModuleExecutable locFile name verbosity conf buildConfig force `finally` setCurrentDirectory origDir return buildResult buildModuleExecutable locFile _name verbosity' config buildConfig' forceOverwrite = do code <- MT.readFile locFile makeAndInstall (Just locFile) Nothing (Code code) [] verbosity' config buildConfig' forceOverwrite -- | Compile a morloc program and optionally install it. -- Shared by `morloc make --install` and `morloc install --build`. makeAndInstall :: Maybe Path -> Maybe String -> Code -> [T.Text] -> Int -> Config.Config -> BuildConfig -> Bool -> IO Bool makeAndInstall path outfile code extraIncludes verbosity config buildConfig force = do let action = do MM.modify (\s -> s {stateInstall = True, stateInstallForce = force}) M.writeProgram translator path code result <- MM.runMorlocMonad outfile verbosity config buildConfig action passed <- MM.writeMorlocReturn result if passed then do let (_, finalState) = result -- Merge include fields from all loaded packages. -- Nothing = include everything (default mode). -- Just [...] = strict allowlist mode. 
pkgIncludes = map packageInclude (statePackageMeta finalState) mergedIncludes | not (null extraIncludes) = -- CLI --include flags force strict mode Just (concatMap (fromMaybe []) pkgIncludes ++ extraIncludes) | all (== Nothing) pkgIncludes = Nothing | otherwise = Just (concatMap (fromMaybe []) pkgIncludes) allSources = concat (GMap.elems (stateSources finalState)) directSourcePaths = [ p | Source{srcPath = Just p} <- allSources ] case stateInstallDir finalState of Nothing -> do putStrLn "Error: install directory was not set during compilation" return False Just installDir -> do let installName = takeFileName installDir packageRoot = case fmap takeDirectory path of Just "" -> "." Just d -> d Nothing -> "." -- Atomic install: clean up installDir on any failure so the user -- is not left with partial state requiring --force on retry. installResult <- try (do -- Only validate coverage in strict mode (explicit include patterns) case mergedIncludes of Just pats -> do Install.validateIncludeCoverage packageRoot pats directSourcePaths Nothing -> return () Install.installProgram (Config.configHome config) installDir installName mergedIncludes force ) :: IO (Either SomeException ()) case installResult of Right () -> return True Left e -> do dirExists <- doesDirectoryExist installDir if dirExists then do removeDirectoryRecursive installDir hPutStrLn stderr $ "Cleaned up partial install: " <> installDir else return () hPutStrLn stderr $ show e return False else return False -- | build a Morloc program, generating the nexus and pool files cmdMake :: MakeCommand -> Int -> Config.Config -> BuildConfig -> IO Bool cmdMake args verbosity config buildConfig = do (path, code) <- readScript (makeExpression args) (makeScript args) outfile <- case makeOutfile args of "" -> return Nothing x -> return . 
Just $ x if makeInstall args then makeAndInstall path outfile code (map T.pack (makeInclude args)) verbosity config buildConfig (makeForce args) else do let action = do MM.modify (\s -> s {stateInstall = False}) M.writeProgram translator path code result <- MM.runMorlocMonad outfile verbosity config buildConfig action passed <- MM.writeMorlocReturn result return passed -- | Evaluate a morloc expression cmdEval :: EvalCommand -> Int -> Config.Config -> BuildConfig -> IO Bool cmdEval args verbosity config buildConfig = do let rawExpr = evalExpression args code = MT.pack (preprocessEvalInput rawExpr) tmpBase = Config.configTmpDir config saveName = evalSave args extraArgs = evalArgs args isSave = not (null saveName) exeName = if isSave then saveName else "eval" createDirectoryIfMissing True tmpBase bracket (do origDir <- getCurrentDirectory tmpDir <- createTempDirectory tmpBase "morloc-eval-" setCurrentDirectory tmpDir return (origDir, tmpDir)) (\(origDir, tmpDir) -> do setCurrentDirectory origDir cleanupTmpDir tmpDir) (\(_origDir, tmpDir) -> do let action = do MM.modify (\s -> s {stateEvalMode = True}) if isSave then MM.modify (\s -> s {stateInstall = True}) else return () M.writeProgram translator Nothing (Code code) result <- MM.runMorlocMonad (Just exeName) verbosity config buildConfig action passed <- MM.writeMorlocReturn result if not passed then return False else if isSave then do let (_, finalState) = result pkgIncludes = map packageInclude (statePackageMeta finalState) mergedIncludes | all (== Nothing) pkgIncludes = Nothing | otherwise = Just (concatMap (fromMaybe []) pkgIncludes) case stateInstallDir finalState of Nothing -> do putStrLn "Error: install directory was not set during compilation" return False Just installDir -> do evalInstallResult <- try (do Install.installProgram (Config.configHome config) installDir saveName mergedIncludes True writeEvalMeta (Config.configHome config) saveName rawExpr ) :: IO (Either SomeException ()) case evalInstallResult 
of Right () -> return True Left e -> do dirExists <- doesDirectoryExist installDir if dirExists then do removeDirectoryRecursive installDir hPutStrLn stderr $ "Cleaned up partial install: " <> installDir else return () hPutStrLn stderr $ show e return False else do let exe = tmpDir exeName subcommand <- getFirstSubcommand exe let cmdArgs = subcommand : extraArgs runResult <- try (SP.callProcess exe cmdArgs) :: IO (Either SomeException ()) case runResult of Right () -> return True Left e -> do putStrLn $ "Error running expression: " ++ show e return False) where cleanupTmpDir dir = do exists <- doesDirectoryExist dir if exists then removeDirectoryRecursive dir else return () -- | Extract the first subcommand name from the manifest embedded in a wrapper script. -- Falls back to "__expr__" if the manifest cannot be parsed. getFirstSubcommand :: FilePath -> IO String getFirstSubcommand wrapperPath = do result <- try (readFile wrapperPath) :: IO (Either SomeException String) case result of Left _ -> return "__expr__" Right contents -> do let marker = "### MANIFEST ###" afterMarker = drop 1 $ dropWhile (/= marker) (lines contents) manifestStr = unlines afterMarker case JSON.eitherDecode (BL.fromStrict (MT.encodeUtf8 (MT.pack manifestStr))) of Right pm -> case pmCommands pm of (cmd : _) -> return (T.unpack (pcName cmd)) [] -> return "__expr__" Left _ -> return "__expr__" -- | Write metadata about the saved eval expression writeEvalMeta :: FilePath -> String -> String -> IO () writeEvalMeta cfgHome name expr = do now <- getCurrentTime let fdbDir = cfgHome "fdb" metaPath = fdbDir name ++ ".eval-meta" timestamp = formatTime defaultTimeLocale "%Y-%m-%dT%H:%M:%SZ" now json = "{\"expression\":" ++ jsonEscape expr ++ ",\"timestamp\":\"" ++ timestamp ++ "\"}" createDirectoryIfMissing True fdbDir writeFile metaPath json where jsonEscape s = "\"" ++ concatMap escChar s ++ "\"" escChar '"' = "\\\"" escChar '\\' = "\\\\" escChar '\n' = "\\n" escChar '\t' = "\\t" escChar c = [c] -- | 
-- | Preprocess eval input: replace top-level semicolons with newlines.
-- Semicolons inside explicit brace blocks (depth > 0) are preserved.
-- Leading whitespace after each replacement is stripped so the layout
-- rule treats each statement as a new top-level declaration.
preprocessEvalInput :: String -> String
preprocessEvalInput = scan (0 :: Int)
  where
    -- scan: outside any string literal, tracking brace nesting depth
    scan _ [] = []
    scan depth ('{' : rest) = '{' : scan (depth + 1) rest
    scan depth ('}' : rest) = '}' : scan (max 0 (depth - 1)) rest
    scan 0 (';' : rest) = '\n' : scan 0 (dropWhile (== ' ') rest)
    scan depth ('"' : rest) = '"' : inString depth rest
    scan depth (c : rest) = c : scan depth rest
    -- inString: inside a double-quoted literal, honoring backslash escapes
    inString depth [] = scan depth []
    inString depth ('"' : rest) = '"' : scan depth rest
    inString depth ('\\' : c : rest) = '\\' : c : inString depth rest
    inString depth (c : rest) = c : inString depth rest

cmdTypecheck :: TypecheckCommand -> Int -> Config.Config -> BuildConfig -> IO Bool
cmdTypecheck args _ config buildConfig = do
  (path, code) <- readScript (typecheckExpression args) (typecheckScript args)
  let verbosity = typecheckVerbose args
  if typecheckType args
    then case F.readType (unCode code) of
      (Left err') -> do
        putStrLn err'
        return False
      (Right x) -> do
        print x
        return True
    else
      if typecheckRealize args
        then do
          (passed, result) <-
            MM.runMorlocMonad
              Nothing
              verbosity
              config
              buildConfig
              ( M.typecheck path code >>= (generatePools .
snd) ) |>> writeTypecheckOutput verbosity putDoc (result <> "\n") return passed else do (passed, result) <- MM.runMorlocMonad Nothing verbosity config buildConfig (M.typecheckFrontend path code) |>> writeFrontendTypecheckOutput verbosity putDoc (result <> "\n") return passed writeFrontendTypecheckOutput :: Int -> ((Either MorlocError [AnnoS (Indexed TypeU) Many Int], [MT.Text]), MorlocState) -> (Bool, MDoc) writeFrontendTypecheckOutput _ ((Left e, _), st) = (False, MM.makeMorlocError st e) writeFrontendTypecheckOutput 0 ((Right xs, _), st) = (True, vsep (map (writeFrontendTypes st) xs)) writeFrontendTypecheckOutput 1 x = writeFrontendTypecheckOutput 0 x -- no difference in verbosity writeFrontendTypecheckOutput _ _ = (False, "I don't know how to be that verbose") writeFrontendTypes :: MorlocState -> AnnoS (Indexed TypeU) Many Int -> MDoc writeFrontendTypes st (AnnoS (Idx i t) _ _) = case Map.lookup i (stateName st) of (Just v) -> pretty v <+> "::" <+> prettyTypeU t Nothing -> "? ::" <+> prettyTypeU t writeTypecheckOutput :: Int -> ((Either MorlocError [(Lang, [SerialManifold])], [MT.Text]), MorlocState) -> (Bool, MDoc) writeTypecheckOutput _ ((Left e, _), st) = (False, MM.makeMorlocError st e) writeTypecheckOutput _ ((Right pools, _), _) = (True, vsep $ map (uncurry writePool) pools) writePool :: Lang -> [SerialManifold] -> MDoc writePool lang manifolds = pretty lang <+> "pool:" <> "\n" <> vsep (map pseudocodeSerialManifold manifolds) <> "\n" cmdDump :: DumpCommand -> Int -> Config.Config -> BuildConfig -> IO Bool cmdDump args _ config buildConfig = do (path, code) <- readScript (dumpExpression args) (dumpScript args) let verbosity = dumpVerbose args ((x, _), st) <- MM.runMorlocMonad Nothing verbosity config buildConfig (F.parse path code) case x of (Left e) -> do putDoc $ MM.makeMorlocError st e return False (Right e) -> do putDoc $ prettyDAG e return True cmdInit :: InitCommand -> Config.Config -> IO Bool cmdInit ic config = MSC.configureAll (not (initQuiet ic)) 
(initForce ic) (initSlurmSupport ic) (initSanitize ic) config cmdNew :: NewCommand -> IO Bool cmdNew args = do let pkgFile = "package.yaml" exists <- doesFileExist pkgFile if exists then do hPutStrLn stderr "Error: package.yaml already exists. Remove it first or use a different directory." return False else do name <- if null (newName args) then takeFileName <$> getCurrentDirectory else return (newName args) writeFile pkgFile $ unlines [ "name: " ++ name , "version: 0.1.0" , "homepage: null" , "synopsis: null" , "description: null" , "category: null" , "license: MIT" , "author: null" , "maintainer: null" , "github: null" , "bug-reports: null" , "dependencies: []" , "# Uncomment to restrict which files are copied during install." , "# By default, all files are included (filtered by .morlocignore)." , "# include:" , "# - \"*.py\"" , "# - \"src/\"" ] hPutStrLn stderr $ "Created package.yaml for '" ++ name ++ "'" return True prettyDAG :: DAG MVar e ExprI -> MDoc prettyDAG m0 = vsep (map prettyEntry (Map.toList m0)) where prettyEntry :: (MVar, (ExprI, [(MVar, e)])) -> MDoc prettyEntry (k, (n, _)) = block 4 (pretty k) (vsep [pretty n]) -- ====================================================================== -- List command -- ====================================================================== -- Lightweight JSON types for reading manifests data ModuleManifest = ModuleManifest { mmName :: T.Text , mmVersion :: T.Text , mmSynopsis :: T.Text , mmExports :: [(T.Text, T.Text)] , mmMorlocDeps :: [T.Text] , mmReason :: T.Text } data ProgramManifest = ProgramManifest { pmName :: T.Text , pmCommands :: [ProgramCommand] } data ProgramCommand = ProgramCommand { pcName :: T.Text , pcReturnType :: T.Text , _pcArgSchemas :: [T.Text] } instance JSON.FromJSON ModuleManifest where parseJSON = JSON.withObject "ModuleManifest" $ \o -> ModuleManifest <$> o JSON..:? "name" JSON..!= "" <*> o JSON..:? "version" JSON..!= "" <*> o JSON..:? "synopsis" JSON..!= "" <*> (o JSON..:? 
"exports" JSON..!= [] >>= mapM parseExport) <*> o JSON..:? "morloc_dependencies" JSON..!= [] <*> o JSON..:? "install_reason" JSON..!= "" where parseExport = JSON.withObject "Export" $ \o -> (,) <$> o JSON..: "name" <*> o JSON..: "type" instance JSON.FromJSON ProgramManifest where parseJSON = JSON.withObject "ProgramManifest" $ \o -> ProgramManifest <$> o JSON..:? "name" JSON..!= "" <*> o JSON..:? "commands" JSON..!= [] instance JSON.FromJSON ProgramCommand where parseJSON = JSON.withObject "ProgramCommand" $ \o -> ProgramCommand <$> o JSON..: "name" <*> o JSON..:? "return_type" JSON..!= "" <*> o JSON..:? "arg_schemas" JSON..!= [] -- | Check if pattern is a subsequence of the target string (case-insensitive) subsequenceMatch :: String -> String -> Bool subsequenceMatch [] _ = True subsequenceMatch _ [] = False subsequenceMatch (p : ps) (t : ts) | toLower p == toLower t = subsequenceMatch ps ts | otherwise = subsequenceMatch (p : ps) ts cmdList :: ListCommand -> Config.Config -> IO Bool cmdList args config = do let fdbDir = Config.configHome config "fdb" libDir = Config.configLibrary config Config.configPlane config verbose = listVerbose args kind = listKind args pat = listPattern args -- Load module manifests allModules <- if kind /= Just ListPrograms then do mods <- loadModuleManifests fdbDir discovered <- discoverModules libDir fdbDir return (mods ++ discovered) else return [] -- Load program manifests allPrograms <- if kind /= Just ListModules then loadProgramManifests fdbDir else return [] -- Filter by pattern let modules = case pat of Nothing -> allModules Just p -> filter (\m -> subsequenceMatch p (T.unpack (mmName m))) allModules programs = case pat of Nothing -> allPrograms Just p -> filter (\m -> subsequenceMatch p (T.unpack (pmName m))) allPrograms -- For verbose mode, fill in exports from .loc files when manifest has none modules' <- if verbose > 0 then mapM (fillModuleExports libDir) modules else return modules -- Print results if null modules' && null 
programs then putStrLn "No installed modules or programs found." else do if not (null modules') then do putStrLn "Modules:" mapM_ (printModule verbose) modules' else return () if not (null programs) then do if not (null modules') then putStrLn "" else return () putStrLn "Programs:" mapM_ (printProgram verbose) programs else return () return True -- | If a module has no exports in its manifest, scan its .loc file for type signatures fillModuleExports :: FilePath -> ModuleManifest -> IO ModuleManifest fillModuleExports libDir m | not (null (mmExports m)) = return m | otherwise = do let modDir = libDir T.unpack (mmName m) modName = T.unpack (mmName m) mainFile <- findMainLocFile modDir modName case mainFile of Nothing -> return m Just f -> do sigs <- extractTypeSignatures f return m {mmExports = sigs} -- | Extract top-level type signatures from a .loc file extractTypeSignatures :: FilePath -> IO [(T.Text, T.Text)] extractTypeSignatures path = do result <- try (TIO.readFile path) :: IO (Either SomeException T.Text) case result of Left _ -> return [] Right content -> return . map parseSig . filter isTypeSig . 
T.lines $ content where isTypeSig ln = let stripped = T.stripStart ln in not (T.null stripped) && T.head stripped /= '-' -- not a comment && T.head stripped /= '{' -- not a block comment && T.isInfixOf " :: " stripped && not (T.isPrefixOf "type " stripped) && not (T.isPrefixOf "source " stripped) && not (T.isPrefixOf "import " stripped) && not (T.isPrefixOf "module " stripped) && not (T.isPrefixOf "class " stripped) && not (T.isPrefixOf "instance " stripped) parseSig ln = let (sigName, rest) = T.breakOn " :: " (T.stripStart ln) typ = T.strip (T.drop 4 rest) -- drop " :: " in (T.strip sigName, typ) loadModuleManifests :: FilePath -> IO [ModuleManifest] loadModuleManifests fdbDir = do result <- try (listDirectory fdbDir) :: IO (Either SomeException [FilePath]) case result of Left _ -> return [] Right entries -> do let moduleFiles = filter (".module" `isSuffixOf`) entries catMaybes <$> mapM ( \f -> do r <- try (BL.readFile (fdbDir f)) :: IO (Either SomeException BL.ByteString) case r of Left _ -> return Nothing Right bs -> case JSON.eitherDecode bs of Right m -> return (Just m) Left _ -> return Nothing ) moduleFiles loadProgramManifests :: FilePath -> IO [ProgramManifest] loadProgramManifests fdbDir = do result <- try (listDirectory fdbDir) :: IO (Either SomeException [FilePath]) case result of Left _ -> return [] Right entries -> do let manifestFiles = filter (".manifest" `isSuffixOf`) entries catMaybes <$> mapM ( \f -> do r <- try (BL.readFile (fdbDir f)) :: IO (Either SomeException BL.ByteString) case r of Left _ -> return Nothing Right bs -> case JSON.eitherDecode bs of Right m -> let m' = if T.null (pmName m) then m {pmName = T.pack (dropExtension (takeFileName f))} else m in return (Just m') Left _ -> return Nothing ) manifestFiles -- | Discover modules in the library that lack manifests discoverModules :: FilePath -> FilePath -> IO [ModuleManifest] discoverModules libDir fdbDir = do libExists <- doesDirectoryExist libDir if not libExists then return [] else do 
entries <- listDirectory libDir catMaybes <$> mapM ( \name -> do let manifestPath = fdbDir name ++ ".module" moduleDir = libDir name hasManifest <- doesFileExist manifestPath isDir <- doesDirectoryExist moduleDir if hasManifest || not isDir then return Nothing else do -- Try to read package.yaml for basic info let pkgYaml = moduleDir "package.yaml" pkgExists <- doesFileExist pkgYaml if pkgExists then do r <- try (BL.readFile pkgYaml) :: IO (Either SomeException BL.ByteString) case r of Left _ -> return (Just (minimalManifest name)) Right bs -> case decodePackageMeta bs of Just meta -> return . Just $ ModuleManifest { mmName = if T.null (packageName meta) then T.pack name else packageName meta , mmVersion = packageVersion meta , mmSynopsis = packageSynopsis meta , mmExports = [] , mmMorlocDeps = [] , mmReason = "" } Nothing -> return (Just (minimalManifest name)) else return (Just (minimalManifest name)) ) entries where minimalManifest name = ModuleManifest { mmName = T.pack name , mmVersion = "" , mmSynopsis = "" , mmExports = [] , mmMorlocDeps = [] , mmReason = "" } printModule :: Int -> ModuleManifest -> IO () printModule verbose m = do let name = mmName m ver = if T.null (mmVersion m) then "" else " " <> T.unpack (mmVersion m) syn = if T.null (mmSynopsis m) then "" else " " <> T.unpack (mmSynopsis m) putStrLn $ " " <> T.unpack name <> ver <> syn if verbose > 0 then mapM_ (\(n, t) -> putStrLn $ " " <> T.unpack n <> " :: " <> T.unpack t) (mmExports m) else return () printProgram :: Int -> ProgramManifest -> IO () printProgram verbose p = do let name = pmName p cmds = pmCommands p cmdCount = length cmds summary = show cmdCount <> " command" <> (if cmdCount /= 1 then "s" else "") putStrLn $ " " <> T.unpack name <> " " <> summary if verbose > 0 then mapM_ (\c -> putStrLn $ " " <> T.unpack (pcName c) <> " :: " <> T.unpack (pcReturnType c)) cmds else return () -- ====================================================================== -- Uninstall command -- 
====================================================================== cmdUninstall :: UninstallCommand -> Config.Config -> IO Bool cmdUninstall args config = do let fdbDir = Config.configHome config "fdb" libDir = Config.configLibrary config Config.configPlane config binDir = Config.configHome config "bin" exeDir = Config.configHome config "exe" dryRun = uninstallDryRun args kind = uninstallKind args names <- if uninstallAll args then do fdbExists <- doesDirectoryExist fdbDir if not fdbExists then return [] else do entries <- listDirectory fdbDir let moduleNames = [dropExtension f | f <- entries, ".module" `isSuffixOf` f] return moduleNames else return (uninstallNames args) if null names then do if uninstallAll args then putStrLn "No modules installed" else putStrLn "No module names specified. Use --all to uninstall all modules." return True else do let skipDepCheck = uninstallAll args allPassed <- mapM (\name -> uninstallOne fdbDir libDir binDir exeDir dryRun skipDepCheck kind name) names let anyRemoved = or allPassed -- Regenerate completions if anything was actually removed if anyRemoved && not dryRun then Completion.regenerateCompletions False (Config.configHome config) else return () return True uninstallOne :: FilePath -> FilePath -> FilePath -> FilePath -> Bool -> Bool -> Maybe ListKind -> String -> IO Bool uninstallOne fdbDir libDir binDir exeDir dryRun skipDepCheck kind name = do let moduleManifest = fdbDir name ++ ".module" programManifest = fdbDir name ++ ".manifest" moduleDir = libDir name hasModule <- doesFileExist moduleManifest hasModuleDir <- doesDirectoryExist moduleDir hasProgram <- doesFileExist programManifest let removeModule = (hasModule || hasModuleDir) && kind /= Just ListPrograms removeProgram = hasProgram && kind /= Just ListModules if not removeModule && not removeProgram then do putStrLn $ "Nothing found for '" <> name <> "'" return False else do -- Reverse dependency check for modules (skip when uninstalling all) if removeModule then 
do if not skipDepCheck then checkReverseDeps fdbDir name else return () if dryRun then do putStrLn $ "Would uninstall module '" <> name <> "'" if hasModuleDir then putStrLn $ " Remove: " <> moduleDir else return () if hasModule then putStrLn $ " Remove: " <> moduleManifest else return () else do if hasModuleDir then removeDirectoryRecursive moduleDir else return () if hasModule then removeFile moduleManifest else return () hPutStrLn stderr $ "Uninstalled module '" <> name <> "'" else return () if removeProgram then do let binPath = binDir name binExists <- doesFileExist binPath if dryRun then do putStrLn $ "Would uninstall program '" <> name <> "'" if binExists then putStrLn $ " Remove: " <> binPath else return () -- Check for exe dir exeDirPath <- findExeDir exeDir name case exeDirPath of Just d -> putStrLn $ " Remove: " <> d Nothing -> return () putStrLn $ " Remove: " <> programManifest else do if binExists then removeFile binPath else return () exeDirPath <- findExeDir exeDir name case exeDirPath of Just d -> removeDirectoryRecursive d Nothing -> return () removeFile programManifest hPutStrLn stderr $ "Uninstalled program '" <> name <> "'" else return () return (removeModule || removeProgram) -- | Find the exe directory for a program findExeDir :: FilePath -> String -> IO (Maybe FilePath) findExeDir exeDir name = do exists <- doesDirectoryExist exeDir if not exists then return Nothing else do entries <- listDirectory exeDir -- Look for name or name- let matches = filter (\e -> e == name || (name ++ "-") `isPrefixOf'` e) entries case matches of (m : _) -> return (Just (exeDir m)) [] -> return Nothing where isPrefixOf' prefix str = take (length prefix) str == prefix -- | Check if any other modules depend on the one being uninstalled checkReverseDeps :: FilePath -> String -> IO () checkReverseDeps fdbDir name = do result <- try (listDirectory fdbDir) :: IO (Either SomeException [FilePath]) case result of Left _ -> return () Right entries -> do let moduleFiles = 
filter (".module" `isSuffixOf`) entries nameT = T.pack name forM_ moduleFiles $ \f -> do r <- try (BL.readFile (fdbDir f)) :: IO (Either SomeException BL.ByteString) case r of Left _ -> return () Right bs -> case JSON.eitherDecode bs :: Either String ModuleManifest of Right m | nameT `elem` mmMorlocDeps m && mmName m /= nameT -> putStrLn $ "Warning: module '" <> T.unpack (mmName m) <> "' depends on '" <> name <> "'" _ -> return () ================================================ FILE: executable/UI.hs ================================================ {- | Module : UI Description : CLI argument parsing with optparse-applicative Copyright : (c) Zebulun Arendsee, 2016-2026 License : Apache-2.0 Maintainer : z@morloc.io Defines the command-line interface for the @morloc@ executable using optparse-applicative: subcommands (make, typecheck, install, init, dump, completion), their options, and help text. -} module UI ( opts , CliCommand (..) , MakeCommand (..) , InitCommand (..) , InstallCommand (..) , TypecheckCommand (..) , DumpCommand (..) , ListCommand (..) , ListKind (..) , UninstallCommand (..) , NewCommand (..) , EvalCommand (..) 
) where

import Morloc.Module (GitProtocol (..), OverwriteProtocol (..))
import Morloc.Version (versionStr)
import Options.Applicative
import qualified Options.Applicative.Extra as OAE

-- | Top-level parser info: the subcommand parser plus @--help@ and @--version@.
opts :: ParserInfo CliCommand
opts =
  info
    (cliParser <**> helper <**> OAE.simpleVersioner versionStr)
    ( fullDesc
        <> progDesc "Call 'morloc make -h', 'morloc install -h', etc for details"
        <> header ("morloc v" <> versionStr)
    )

-- | One constructor per morloc subcommand.
data CliCommand
  = CmdMake MakeCommand
  | CmdInstall InstallCommand
  | CmdUninstall UninstallCommand
  | CmdList ListCommand
  | CmdTypecheck TypecheckCommand
  | CmdDump DumpCommand
  | CmdInit InitCommand
  | CmdNew NewCommand
  | CmdEval EvalCommand

-- | Dispatch over all registered subcommands.
cliParser :: Parser CliCommand
cliParser =
  hsubparser
    ( makeSubcommand
        <> installSubcommand
        <> uninstallSubcommand
        <> listSubcommand
        <> typecheckSubcommand
        <> dumpSubcommand
        <> initSubcommand
        <> newSubcommand
        <> evalSubcommand
    )

-- | Options for @morloc make@.
data MakeCommand = MakeCommand
  { makeExpression :: Bool
  , makeConfig :: String
  , makeVerbose :: Int
  , makeVanilla :: Bool
  , makeOutfile :: String
  , makeInstall :: Bool
  , makeForce :: Bool
  , makeInclude :: [String]
  , makeScript :: String
  }

makeCommandParser :: Parser MakeCommand
makeCommandParser =
  MakeCommand
    <$> optExpression
    <*> optConfig
    <*> optVerbose
    <*> optVanilla
    <*> optOutfile
    <*> optMakeInstall
    <*> optMakeForce
    <*> optMakeInclude
    <*> optScript

makeSubcommand :: Mod CommandFields CliCommand
makeSubcommand =
  command "make" $
    info (CmdMake <$> makeCommandParser) (progDesc "Build a morloc script")

-- | Options for @morloc init@.
data InitCommand = InitCommand
  { initConfig :: String
  , initQuiet :: Bool
  , initVanilla :: Bool
  , initForce :: OverwriteProtocol
  , initSlurmSupport :: Bool
  , initSanitize :: Bool
  }

initCommandParser :: Parser InitCommand
initCommandParser =
  InitCommand
    <$> optConfig
    <*> optQuiet
    <*> optVanilla
    <*> optForce
    <*> optSlurmSupport
    <*> optSanitize

initSubcommand :: Mod CommandFields CliCommand
initSubcommand =
  command "init" $
    info (CmdInit <$> initCommandParser) (progDesc "Initialize morloc environment")

-- | Options for @morloc new@.
data NewCommand = NewCommand
  { newName :: String
  }

newCommandParser :: Parser NewCommand
newCommandParser =
  NewCommand
    <$> strArgument
      ( metavar "NAME"
          <> value ""
          <> help "Package name (defaults to current directory name)"
      )

newSubcommand :: Mod CommandFields CliCommand
newSubcommand =
  command "new" $
    info (CmdNew <$> newCommandParser) (progDesc "Create a new morloc package")

-- | Options for @morloc install@.
data InstallCommand = InstallCommand
  { installConfig :: String
  , installVanilla :: Bool
  , installVerbose :: Int
  , installForce :: OverwriteProtocol
  , installUseSSH :: GitProtocol
  , installNoTypecheck :: Bool
  , installBuild :: Bool
  , installModuleStrings :: [String]
  }

makeInstallParser :: Parser InstallCommand
makeInstallParser =
  InstallCommand
    <$> optConfig
    <*> optVanilla
    <*> optVerbose
    <*> optForce
    <*> optUseSSH
    <*> optNoTypecheck
    <*> optInstallBuild
    <*> optModuleStrings

installSubcommand :: Mod CommandFields CliCommand
installSubcommand =
  command "install" $
    info (CmdInstall <$> makeInstallParser) (progDesc "Install a morloc module")

-- | Options for @morloc typecheck@.
data TypecheckCommand = TypecheckCommand
  { typecheckConfig :: String
  , typecheckVanilla :: Bool
  , typecheckType :: Bool
  , typecheckRaw :: Bool
  , typecheckExpression :: Bool
  , typecheckVerbose :: Int
  , typecheckRealize :: Bool
  , typecheckScript :: String
  }

makeTypecheckParser :: Parser TypecheckCommand
makeTypecheckParser =
  TypecheckCommand
    <$> optConfig
    <*> optVanilla
    <*> optType
    <*> optRaw
    <*> optExpression
    <*> optVerbose
    <*> optRealize
    <*> optScript

typecheckSubcommand :: Mod CommandFields CliCommand
typecheckSubcommand =
  command "typecheck" $
    info (CmdTypecheck <$> makeTypecheckParser) (progDesc "Typecheck a morloc program")

dumpSubcommand :: Mod CommandFields CliCommand
dumpSubcommand =
  command "dump" $
    info (CmdDump <$> makeDumpParser) (progDesc "Dump parsed code")

-- | Options for @morloc dump@.
data DumpCommand = DumpCommand
  { dumpConfig :: String
  , dumpVanilla :: Bool
  , dumpVerbose :: Int
  , dumpExpression :: Bool
  , dumpScript :: String
  }

makeDumpParser :: Parser DumpCommand
makeDumpParser =
  DumpCommand
    <$> optConfig
    <*> optVanilla
    <*> optVerbose
    <*> optExpression
    <*> optScript

-- | Restrict list/uninstall operations to modules or to programs.
data ListKind = ListModules | ListPrograms
  deriving (Show, Eq)

-- | Options for @morloc list@.
data ListCommand = ListCommand
  { listPattern :: Maybe String
  , listConfig :: String
  , listVanilla :: Bool
  , listVerbose :: Int
  , listKind :: Maybe ListKind
  }

makeListParser :: Parser ListCommand
makeListParser =
  ListCommand
    <$> optListPattern
    <*> optConfig
    <*> optVanilla
    <*> optVerbose
    <*> optListKind

listSubcommand :: Mod CommandFields CliCommand
listSubcommand =
  command "list" $
    info (CmdList <$> makeListParser) (progDesc "List installed modules and programs")

-- | Options for @morloc uninstall@.
data UninstallCommand = UninstallCommand
  { uninstallNames :: [String]
  , uninstallConfig :: String
  , uninstallVanilla :: Bool
  , uninstallKind :: Maybe ListKind
  , uninstallDryRun :: Bool
  , uninstallAll :: Bool
  }

makeUninstallParser :: Parser UninstallCommand
makeUninstallParser =
  UninstallCommand
    <$> optUninstallNamesOrNone
    <*> optConfig
    <*> optVanilla
    <*> optUninstallKind
    <*> optDryRun
    <*> optUninstallAll

uninstallSubcommand :: Mod CommandFields CliCommand
uninstallSubcommand =
  command "uninstall" $
    info (CmdUninstall <$> makeUninstallParser) (progDesc "Uninstall a module or program")

-- Shared option parsers -------------------------------------------------

optExpression :: Parser Bool
optExpression =
  switch
    ( long "expression"
        <> short 'e'
        <> help "Read script as string rather than file"
    )

optVanilla :: Parser Bool
optVanilla =
  switch
    ( long "vanilla"
        <> help "Ignore local configuration files"
    )

optForce :: Parser OverwriteProtocol
optForce =
  flag
    DoNotOverwrite
    ForceOverwrite
    ( long "force"
        <> short 'f'
        <> help "Overwrite files if they already exist"
    )

optUseSSH :: Parser GitProtocol
optUseSSH =
  flag
    HttpsProtocol
    SshProtocol
    ( long "ssh"
        <> help "Use SSH protocol for remote git access"
    )

optNoTypecheck :: Parser Bool
optNoTypecheck =
  switch
    ( long "no-typecheck"
        <> help "Skip typechecking during install"
    )

optInstallBuild :: Parser Bool
optInstallBuild =
  switch
    ( long "build"
        <> short 'b'
        <> help "Build and install executable after module install"
    )

-- | One or more positional module install strings.
optModuleStrings :: Parser [String]
optModuleStrings =
  some
    ( strArgument
        ( metavar "INSTALL"
            <> help "Module install strings"
        )
    )

optRaw :: Parser Bool
optRaw =
  switch
    ( long "raw"
        <> help "Print raw objects"
    )

optSlurmSupport :: Parser Bool
optSlurmSupport =
  switch
    ( long "slurm"
        <> help "Allow use of SLURM for remote jobs"
    )

optSanitize :: Parser Bool
optSanitize =
  switch
    ( long "sanitize"
        <> help "Enable alignment sanitizer for debugging memory layout issues"
    )

-- | Count repeated @-v@ flags to yield a verbosity level.
optVerbose :: Parser Int
optVerbose = length <$> many (flag' () (short 'v'))

optQuiet :: Parser Bool
optQuiet =
  switch
    ( long "quiet"
        <> short 'q'
        <> help "Print minimal output to STDERR"
    )

optRealize :: Parser Bool
optRealize =
  switch
    ( long "realize"
        <> short 'r'
        <> help "Typecheck the composition realizations"
    )

optConfig :: Parser String
optConfig =
  strOption
    ( long "config"
        <> metavar "CONFIG"
        <> value ""
        <> help "Use this config rather than the one in morloc home"
    )

optOutfile :: Parser String
optOutfile =
  strOption
    ( long "outfile"
        <> short 'o'
        <> metavar "OUT"
        <> value ""
        <> showDefault
        <> help "The name of the generated executable"
    )

optMakeInstall :: Parser Bool
optMakeInstall =
  switch
    ( long "install"
        <> help "Install module to PATH"
    )

optMakeForce :: Parser Bool
optMakeForce =
  switch
    ( long "force"
        <> short 'f'
        <> help "Overwrite existing install"
    )

optMakeInclude :: Parser [String]
optMakeInclude =
  many
    ( strOption
        ( long "include"
            <> metavar "PATTERN"
            <> help "File pattern to include in install"
        )
    )

optScript :: Parser String
optScript = argument str (metavar "