Repository: stephenslab/susieR Branch: master Commit: 00f8ea82d576 Files: 222 Total size: 1.9 MB Directory structure: gitextract_f5azyrwd/ ├── .Rbuildignore ├── .github/ │ ├── dependabot.yml │ ├── rattler-build_container.df │ ├── recipe/ │ │ ├── recipe.yaml │ │ ├── variant_r44.yaml │ │ └── variant_r45.yaml │ └── workflows/ │ ├── ci.yml │ ├── conda_build.yml │ ├── dispatch_pkgdown_build.yml │ └── release.yml ├── .gitignore ├── DESCRIPTION ├── LICENSE ├── LICENSE.md ├── Makefile ├── NAMESPACE ├── R/ │ ├── cpp11.R │ ├── diagnosis_reports.R │ ├── example_dataset.R │ ├── generic_methods.R │ ├── individual_data_methods.R │ ├── iterative_bayesian_stepwise_selection.R │ ├── mixture_prior.R │ ├── model_methods.R │ ├── mr.ash.R │ ├── mr.ash.rss.R │ ├── predict.susie.R │ ├── refinement.R │ ├── rss_lambda_methods.R │ ├── rss_mismatch.R │ ├── single_effect_regression.R │ ├── slot_prior.R │ ├── sparse_multiplication.R │ ├── ss_mixture_methods.R │ ├── sufficient_stats_methods.R │ ├── summary.susie.R │ ├── susie.R │ ├── susieR-package.R │ ├── susie_auto.R │ ├── susie_constructors.R │ ├── susie_get_functions.R │ ├── susie_plot.R │ ├── susie_post_outcome_configuration.R │ ├── susie_rss_utils.R │ ├── susie_trendfilter.R │ ├── susie_trendfilter_utils.R │ ├── susie_utils.R │ ├── susie_workhorse.R │ └── univariate_regression.R ├── README.md ├── _pkgdown.yml ├── data/ │ ├── FinemappingConvergence.RData │ ├── N2finemapping.RData │ ├── N3finemapping.RData │ ├── SummaryConsistency.RData │ ├── data_small.RData │ └── unmappable_data.RData ├── inst/ │ ├── CITATION │ ├── analysis/ │ │ ├── optimize.Rmd │ │ ├── test_susie_auto.Rmd │ │ └── testing.Rmd │ ├── code/ │ │ ├── caviar.R │ │ ├── compute_ss_memory.R │ │ ├── dap-g.py │ │ ├── finemap.R │ │ ├── finemap_1p4.R │ │ ├── gen_original_results.R │ │ ├── monitor_memory.py │ │ ├── python_example/ │ │ │ ├── N3finemapping_python.ipynb │ │ │ └── environment.yml │ │ ├── simulate_lambda_pop_ld_bias.R │ │ ├── small_sim.R │ │ ├── sparse_matrix_strategy.Rmd │ 
│ ├── summarize_small_sim.R │ │ ├── susie_memory.R │ │ └── susie_rss_memory.R │ ├── datafiles/ │ │ ├── FinemappingConvergence1k.RData │ │ ├── N3finemapping.CAVIAR.RData │ │ ├── N3finemapping.DAP.RData │ │ ├── N3finemapping.FINEMAP.RData │ │ ├── SummaryConsistency1k.RData │ │ └── small_sim_out_v0.14.48.RData │ ├── misc/ │ │ ├── README_susie_v2.md │ │ ├── format_r_code.sh │ │ ├── post-commit.sh │ │ ├── pre-commit.sh │ │ └── uncrustify_default.cfg │ └── notebooks/ │ ├── benchmark_mix_vs_sp.R │ ├── small_sample_benchmark.ipynb │ └── stochastic_ld_benchmark.ipynb ├── man/ │ ├── FinemappingConvergence.Rd │ ├── N2finemapping.Rd │ ├── N3finemapping.Rd │ ├── SummaryConsistency.Rd │ ├── absolute.order.Rd │ ├── add_delta_features.Rd │ ├── block_coordinate_ascent.Rd │ ├── calculate_posterior_moments_mixture_common.Rd │ ├── check_alpha_pip_cycle_convergence.Rd │ ├── cleanup_extra_fields.Rd │ ├── coef.mr.ash.Rd │ ├── coef.susie.Rd │ ├── collect_ash_diag.Rd │ ├── compare_ash_methods.Rd │ ├── compute_marginal_bhat_shat.Rd │ ├── compute_suff_stat.Rd │ ├── data_small.Rd │ ├── diagnose_ash_filter_archived_iter.Rd │ ├── diagnose_bb_ash_iter.Rd │ ├── estimate_s_rss.Rd │ ├── extract_bb_ash_features.Rd │ ├── format_extra_diag.Rd │ ├── format_sigma2_summary.Rd │ ├── get.full.posterior.Rd │ ├── get_alpha_l.Rd │ ├── get_cs_correlation.Rd │ ├── get_objective.Rd │ ├── get_posterior_mean_l.Rd │ ├── get_posterior_mean_sum.Rd │ ├── get_posterior_moments_l.Rd │ ├── get_prior_variance_l.Rd │ ├── get_slot_weight.Rd │ ├── ibss_finalize.Rd │ ├── ibss_initialize.Rd │ ├── is_symmetric_matrix.Rd │ ├── kriging_rss.Rd │ ├── label_diag_truth.Rd │ ├── loglik_mixture_common.Rd │ ├── mr.ash.Rd │ ├── mr.ash.rss.Rd │ ├── path.order.Rd │ ├── post_loglik_prior_hook.Rd │ ├── pre_loglik_prior_hook.Rd │ ├── predict.mr.ash.Rd │ ├── predict.susie.Rd │ ├── print.summary.susie_post_outcome_configuration.Rd │ ├── resolve_mixture_prior.Rd │ ├── safe_cor.Rd │ ├── safe_cov2cor.Rd │ ├── scale_design_matrix.Rd │ ├── 
set_prior_variance_l.Rd │ ├── slot_prior_betabinom.Rd │ ├── summary.susie.Rd │ ├── summary.susie_post_outcome_configuration.Rd │ ├── susie.Rd │ ├── susieR-package.Rd │ ├── susie_auto.Rd │ ├── susie_get_methods.Rd │ ├── susie_init_coef.Rd │ ├── susie_plot_changepoint.Rd │ ├── susie_plots.Rd │ ├── susie_post_outcome_configuration.Rd │ ├── susie_rss.Rd │ ├── susie_rss_lambda.Rd │ ├── susie_ss.Rd │ ├── susie_trendfilter.Rd │ ├── susie_workhorse.Rd │ ├── univar.order.Rd │ ├── univariate_regression.Rd │ └── unmappable_data.Rd ├── pixi.toml ├── src/ │ ├── Makevars │ ├── Makevars.win │ ├── caisa.cpp │ ├── cpp11.cpp │ ├── mr_ash.h │ ├── mr_ash_rss.cpp │ └── mr_ash_rss.h ├── tests/ │ ├── README.md │ ├── testthat/ │ │ ├── helper_nig_reference.R │ │ ├── helper_reference.R │ │ ├── helper_testthat.R │ │ ├── reference/ │ │ │ ├── test_susie_auto_reference.R │ │ │ ├── test_susie_nig_reference.R │ │ │ ├── test_susie_reference.R │ │ │ ├── test_susie_rss_lambda_reference.R │ │ │ ├── test_susie_rss_reference.R │ │ │ └── test_susie_ss_reference.R │ │ ├── test_X_centering.R │ │ ├── test_coef_predict.R │ │ ├── test_compute_marginal_bhat_shat.R │ │ ├── test_generic_methods.R │ │ ├── test_ibss.R │ │ ├── test_individual_data_methods.R │ │ ├── test_l_greedy.R │ │ ├── test_mixture_prior.R │ │ ├── test_mr_ash_equivalence.R │ │ ├── test_plotting.R │ │ ├── test_post_outcome_configuration_summary.R │ │ ├── test_refinement.R │ │ ├── test_rss_lambda_methods.R │ │ ├── test_rss_mismatch.R │ │ ├── test_rss_utils.R │ │ ├── test_single_effect_regression.R │ │ ├── test_slot_prior.R │ │ ├── test_slot_weights.R │ │ ├── test_sparse_multiplication.R │ │ ├── test_sufficient_stats_methods.R │ │ ├── test_summary_print.R │ │ ├── test_susie.R │ │ ├── test_susie_ash_ss_equivalence.R │ │ ├── test_susie_auto.R │ │ ├── test_susie_constructors.R │ │ ├── test_susie_get_functions.R │ │ ├── test_susie_small.R │ │ ├── test_susie_utils.R │ │ ├── test_susie_workhorse.R │ │ ├── test_trendfilter.R │ │ └── 
test_univariate_regression.R │ └── testthat.R └── vignettes/ ├── announcements.Rmd ├── finemapping.Rmd ├── finemapping_summary_statistics.Rmd ├── l0_initialization.Rmd ├── mwe.Rmd ├── small_sample.Rmd ├── sparse_susie_eval.Rmd ├── susie_refine.Rmd ├── susie_rss.Rmd ├── susie_unmappable_effects.Rmd ├── susierss_diagnostic.Rmd └── trend_filtering.Rmd ================================================ FILE CONTENTS ================================================ ================================================ FILE: .Rbuildignore ================================================ ^docs$ ^.gitignore$ ^appveyor\.yml$ ^_pkgdown\.yml$ ^Makefile$ ^\.circleci$ ^susieR\.Rproj$ ^\.Rproj\.user$ ^\.travis\.yml$ ^.*\.Rproj$ ^tests/testthat/full_data_1_sim_gaussian_null_1\.rds$ ^inst/datafiles$ ^inst/code/compute_ss_data\.RData$ ^inst/code/susie_data\.RData$ ^inst/code/susie_rss_data\.RData$ ^LICENSE\.md$ ^NOTES\.txt$ ^\.Renviron$ ^pixi\.toml$ ^pixi\.lock$ ^\.pixi/.* ^\.github$ ================================================ FILE: .github/dependabot.yml ================================================ version: 2 updates: - package-ecosystem: "github-actions" directory: "/" schedule: interval: "weekly" ================================================ FILE: .github/rattler-build_container.df ================================================ FROM ghcr.io/prefix-dev/pixi:latest SHELL ["/bin/bash", "-c"] RUN apt-get update RUN apt-get install -y libgl1 ca-certificates RUN groupadd -g 118 github RUN useradd -m -u 1001 -g 118 -s /bin/bash runner USER runner RUN pixi global install rattler-build git patch ENV PATH=/home/runner/.pixi/bin:${PATH} ================================================ FILE: .github/recipe/recipe.yaml ================================================ context: version: VERSION_PLACEHOLDER package: name: r-susier version: ${{ version }} source: path: susieR-${{ version }}.tar.gz sha256: SHA256SUM_PLACEHOLDER build: number: BUILD_PLACEHOLDER dynamic_linking: rpaths: - 
lib/R/lib/ - lib/ script: R CMD INSTALL --build . requirements: build: - ${{ compiler('c') }} - ${{ stdlib('c') }} - ${{ compiler('cxx') }} host: - r-base - r-cowplot - r-crayon - r-curl - r-ggplot2 - r-knitr - r-l0learn - r-matrix - r-matrixstats - r-microbenchmark - r-mixsqp - r-cpp11 - r-cpp11armadillo - r-reshape - r-rfast - r-rmarkdown - r-survival - r-testthat run: - r-base - r-cowplot - r-crayon - r-curl - r-ggplot2 - r-knitr - r-l0learn - r-matrix - r-matrixstats - r-microbenchmark - r-mixsqp - r-cpp11 - r-cpp11armadillo - r-reshape - r-rfast - r-rmarkdown - r-survival - r-testthat tests: - script: - R -e "library('susieR')" about: license: BSD-3-Clause license_file: LICENSE summary: Implements methods for variable selection in linear regression based on the Sum of Single Effects (SuSiE) model. homepage: https://github.com/stephenslab/susieR extra: recipe-maintainers: - danielnachun ================================================ FILE: .github/recipe/variant_r44.yaml ================================================ MACOSX_DEPLOYMENT_TARGET: - '11.0' c_stdlib_version: - if: linux then: 2.17 - if: osx then: 11.0 c_stdlib: - if: linux then: sysroot - if: osx then: macosx_deployment_target r_base: - 4.4 ================================================ FILE: .github/recipe/variant_r45.yaml ================================================ MACOSX_DEPLOYMENT_TARGET: - '11.0' c_stdlib_version: - if: linux then: 2.17 - if: osx then: 11.0 c_stdlib: - if: linux then: sysroot - if: osx then: macosx_deployment_target r_base: - 4.5 ================================================ FILE: .github/workflows/ci.yml ================================================ name: Continuous Integration on: push: branches: master pull_request: paths-ignore: - .github/* - .gitignore - README.md jobs: ci_linux-64: name: linux-64 CI runs-on: ubuntu-latest env: CODECOV_TOKEN: ${{ secrets.CODECOV_TOKEN }} strategy: fail-fast: false matrix: environment: ["r44", "r45"] steps: - name: Checkout 
pull request branch uses: actions/checkout@v4 with: fetch-depth: 0 - name: Copy TOML run: | mkdir /tmp/pixi cp ${GITHUB_WORKSPACE}/pixi.toml /tmp/pixi - name: Setup pixi uses: prefix-dev/setup-pixi@v0.9.4 with: run-install: false - name: Run unit tests run: pixi run --environment ${{ matrix.environment }} --manifest-path /tmp/pixi/pixi.toml devtools_test - name: Run R CMD CHECK run: | pixi run --environment ${{ matrix.environment }} --manifest-path /tmp/pixi/pixi.toml build pixi run --environment ${{ matrix.environment }} --manifest-path /tmp/pixi/pixi.toml rcmdcheck - name: Check unit test code coverage if: ${{ matrix.environment == 'r44' }} run: pixi run --environment ${{ matrix.environment }} --manifest-path /tmp/pixi/pixi.toml codecov ci_osx-arm64: name: osx-arm64 CI runs-on: macos-latest strategy: fail-fast: false matrix: environment: ["r44", "r45"] steps: - name: Checkout pull request branch uses: actions/checkout@v4 with: fetch-depth: 0 - name: Copy TOML run: | mkdir /tmp/pixi cp ${GITHUB_WORKSPACE}/pixi.toml /tmp/pixi - name: Setup pixi uses: prefix-dev/setup-pixi@v0.9.4 with: run-install: false - name: Run unit tests run: pixi run --environment ${{ matrix.environment }} --manifest-path /tmp/pixi/pixi.toml devtools_test - name: Run R CMD CHECK run: | pixi run --environment ${{ matrix.environment }} --manifest-path /tmp/pixi/pixi.toml build pixi run --environment ${{ matrix.environment }} --manifest-path /tmp/pixi/pixi.toml rcmdcheck ================================================ FILE: .github/workflows/conda_build.yml ================================================ name: Build conda package on: release: types: [published] workflow_dispatch: inputs: version: description: Version to package required: true default: 'latest' build: description: "Build revision of package (default: 0)" required: false default: '0' jobs: build_package_linux-64: name: Build conda package for linux-64 runs-on: ubuntu-latest strategy: fail-fast: false matrix: variant: ["r44", 
"r45"] env: ANACONDA_API_KEY: ${{ secrets.ANACONDA_API_TOKEN }} ANACONDA_OWNER: ${{ vars.ANACONDA_OWNER }} steps: - name: Checkout repository uses: actions/checkout@v6 with: fetch-depth: 0 - name: Get latest version id: latest-version if: github.event_name == 'workflow_dispatch' && github.event.inputs.version == 'latest' uses: pozetroninc/github-action-get-latest-release@v0.8.0 with: repository: ${{ github.repository }} token: ${{ secrets.CI_TOKEN }} - name: Set version id: set-version run: | if [[ "${{ github.event_name }}" == "release" ]]; then version="${{ github.event.release.tag_name }}" elif [[ "${{ github.event.inputs.version }}" != "latest" ]]; then version="${{ github.event.inputs.version }}" else version="${{ steps.latest-version.outputs.release }}" fi echo "version=${version}" >> "$GITHUB_OUTPUT" - name: Set build number id: set-build run: | if [[ "${{ github.event_name }}" == "release" ]]; then echo "build=0" >> "$GITHUB_OUTPUT" else echo "build=${{ github.event.inputs.build }}" >> "$GITHUB_OUTPUT" fi - name: Download release uses: robinraju/release-downloader@v1 with: tag: ${{ steps.set-version.outputs.version }} token: ${{ secrets.CI_TOKEN }} out-file-path: /tmp/recipe tarBall: true - name: Setup pixi uses: prefix-dev/setup-pixi@v0.9.4 with: run-install: false - name: Create recipe from template shell: pixi exec --spec sed --spec coreutils --spec wget -- bash -e {0} run: | cp .github/recipe/recipe.yaml /tmp/recipe/recipe.yaml cp .github/recipe/variant_${{ matrix.variant }}.yaml /tmp/recipe/variants.yaml repository=${{ github.repository }} build=${{ steps.set-build.outputs.build }} version=${{ steps.set-version.outputs.version }} sha256sum=$(sha256sum /tmp/recipe/${repository//*\//}-${version}.tar.gz | cut -d ' ' -f 1) sed -i "s/VERSION_PLACEHOLDER/${version}/g" /tmp/recipe/recipe.yaml sed -i "s/SHA256SUM_PLACEHOLDER/${sha256sum}/g" /tmp/recipe/recipe.yaml sed -i "s/BUILD_PLACEHOLDER/${build}/g" /tmp/recipe/recipe.yaml - name: Setup up docker buildx 
uses: docker/setup-buildx-action@v4 - name: Build and export docker containers uses: docker/build-push-action@v7 with: load: true file: .github/rattler-build_container.df tags: rattler-build:latest - name: Build conda packages run: | # Bind-mount the workspace into the container: --volume needs the # host:container form; a bare "--volume $(pwd)" creates an empty # anonymous volume at that path, leaving --workdir without the repo. docker run --rm --volume /tmp:/tmp \ --volume /etc/passwd:/etc/passwd:ro \ --volume /etc/group:/etc/group:ro \ --volume $(pwd):$(pwd) --workdir $(pwd) \ --user $(id -u) rattler-build \ rattler-build build -c dnachun -c conda-forge -c bioconda \ --output-dir /tmp/rattler-build --recipe-dir /tmp/recipe - name: Upload package shell: pixi exec --spec rattler-build -- bash -e {0} run: rattler-build upload anaconda --force /tmp/rattler-build/linux-64/*.conda build_package_osx-arm64: name: Build conda package for osx-arm64 runs-on: macos-14 strategy: fail-fast: false matrix: variant: ["r44", "r45"] env: ANACONDA_API_KEY: ${{ secrets.ANACONDA_API_TOKEN }} ANACONDA_OWNER: ${{ vars.ANACONDA_OWNER }} steps: - name: Checkout repository uses: actions/checkout@v6 with: fetch-depth: 0 - name: Get latest version id: latest-version if: github.event_name == 'workflow_dispatch' && github.event.inputs.version == 'latest' uses: pozetroninc/github-action-get-latest-release@v0.8.0 with: repository: ${{ github.repository }} token: ${{ secrets.CI_TOKEN }} - name: Set version id: set-version run: | if [[ "${{ github.event_name }}" == "release" ]]; then version="${{ github.event.release.tag_name }}" elif [[ "${{ github.event.inputs.version }}" != "latest" ]]; then version="${{ github.event.inputs.version }}" else version="${{ steps.latest-version.outputs.release }}" fi echo "version=${version}" >> "$GITHUB_OUTPUT" - name: Set build number id: set-build run: | if [[ "${{ github.event_name }}" == "release" ]]; then echo "build=0" >> "$GITHUB_OUTPUT" else echo "build=${{ github.event.inputs.build }}" >> "$GITHUB_OUTPUT" fi - name: Download release uses: robinraju/release-downloader@v1 with: tag: ${{ steps.set-version.outputs.version }} token: ${{ secrets.CI_TOKEN }}
out-file-path: /tmp/recipe tarBall: true - name: Setup pixi uses: prefix-dev/setup-pixi@v0.9.4 with: run-install: false - name: Create recipe from template shell: pixi exec --spec sed --spec coreutils --spec wget -- bash -e {0} run: | cp .github/recipe/recipe.yaml /tmp/recipe/recipe.yaml cp .github/recipe/variant_${{ matrix.variant }}.yaml /tmp/recipe/variants.yaml repository=${{ github.repository }} build=${{ steps.set-build.outputs.build }} version=${{ steps.set-version.outputs.version }} sha256sum=$(sha256sum /tmp/recipe/${repository//*\//}-${version}.tar.gz | cut -d ' ' -f 1) sed -i "s/VERSION_PLACEHOLDER/${version}/g" /tmp/recipe/recipe.yaml sed -i "s/SHA256SUM_PLACEHOLDER/${sha256sum}/g" /tmp/recipe/recipe.yaml sed -i "s/BUILD_PLACEHOLDER/${build}/g" /tmp/recipe/recipe.yaml - name: Build conda package shell: pixi exec --spec rattler-build -- bash -e {0} run: rattler-build build -c dnachun -c conda-forge -c bioconda --output-dir /tmp/rattler-build --recipe-dir /tmp/recipe - name: Upload package shell: pixi exec --spec rattler-build -- bash -e {0} run: rattler-build upload anaconda --force /tmp/rattler-build/osx-arm64/*.conda ================================================ FILE: .github/workflows/dispatch_pkgdown_build.yml ================================================ name: Deploy website on: push: branches: ["master"] workflow_dispatch: env: GITHUB_TOKEN: ${{ secrets.GITHUB_TOKEN }} permissions: contents: read pages: write id-token: write concurrency: group: "pages" cancel-in-progress: false jobs: build: runs-on: ubuntu-latest steps: - name: Checkout master uses: actions/checkout@v5 with: ref: master - name: Setup pixi uses: prefix-dev/setup-pixi@v0.9.4 - name: Update pkgdown site run: pixi run -e r44 pkgdown_build - name: Setup Pages uses: actions/configure-pages@v5 - name: Upload artifact uses: actions/upload-pages-artifact@v5 with: path: ./docs deploy: environment: name: github-pages url: ${{ steps.deployment.outputs.page_url }} runs-on: ubuntu-latest 
needs: build steps: - name: Deploy to GitHub Pages id: deployment uses: actions/deploy-pages@v4 ================================================ FILE: .github/workflows/release.yml ================================================ name: Upload new release on: push: branches: [master] paths: [DESCRIPTION] workflow_dispatch: inputs: tag: description: Version to use for release tag default: auto required: true commit: description: Commit to use for tag default: auto required: true increment_major_version: description: Increment major version default: false required: true increment_minor_version: description: Increment minor version default: false required: true increment_patch_version: description: Increment patch version default: true required: true # Prevent duplicate releases when manual dispatch pushes a version commit concurrency: group: release cancel-in-progress: false jobs: # Only runs on manual dispatch to bump version in DESCRIPTION update_version: outputs: commit: ${{ steps.commit-changes.outputs.commit_long_sha }} runs-on: ubuntu-latest if: github.event_name == 'workflow_dispatch' && github.event.inputs.commit == 'auto' steps: - name: Checkout repository uses: actions/checkout@v6 with: token: ${{ secrets.CI_TOKEN }} fetch-depth: 0 repository: ${{ github.repository }} ref: master - name: Setup pixi uses: prefix-dev/setup-pixi@v0.9.4 - name: Update version run: | if [[ "${{ github.event.inputs.tag }}" != "auto" ]]; then sed -i 's/Version: .*$/Version: ${{ github.event.inputs.tag }}/' DESCRIPTION elif [[ "${{ github.event.inputs.increment_major_version }}" == "true" ]]; then pixi run use_major_version elif [[ "${{ github.event.inputs.increment_minor_version }}" == "true" ]]; then pixi run use_minor_version elif [[ "${{ github.event.inputs.increment_patch_version }}" == "true" ]]; then pixi run use_patch_version fi - name: Commit changes to version id: commit-changes uses: EndBug/add-and-commit@v10 with: push: true message: Update version # Creates tag + GitHub 
release — runs for both push and manual triggers create_release: needs: update_version # Run when update_version succeeds (manual) or is skipped (push trigger) if: always() && (needs.update_version.result == 'success' || needs.update_version.result == 'skipped') runs-on: ubuntu-latest permissions: contents: write steps: - name: Determine commit id: determine-commit run: | if [[ "${{ github.event_name }}" == "push" ]]; then echo "commit=${{ github.sha }}" >> "$GITHUB_OUTPUT" elif [[ "${{ github.event.inputs.commit }}" != "auto" ]]; then echo "commit=${{ github.event.inputs.commit }}" >> "$GITHUB_OUTPUT" else echo "commit=${{ needs.update_version.outputs.commit }}" >> "$GITHUB_OUTPUT" fi - name: Checkout uses: actions/checkout@v6 with: ref: ${{ steps.determine-commit.outputs.commit }} fetch-depth: 0 - name: Set tag from DESCRIPTION id: set-tag run: | if [[ "${{ github.event_name }}" == "workflow_dispatch" && "${{ github.event.inputs.tag }}" != "auto" ]]; then tag="${{ github.event.inputs.tag }}" else tag=$(grep "^Version:" DESCRIPTION | sed 's/Version: *//') fi echo "tag=${tag}" >> "$GITHUB_OUTPUT" - name: Check if tag already exists id: check-tag run: | if git rev-parse "refs/tags/${{ steps.set-tag.outputs.tag }}" >/dev/null 2>&1; then echo "exists=true" >> "$GITHUB_OUTPUT" echo "::notice::Tag ${{ steps.set-tag.outputs.tag }} already exists — skipping release" else echo "exists=false" >> "$GITHUB_OUTPUT" fi - name: Check if major or minor version changed id: check-version-change run: | # Strip optional v prefix so legacy v-prefixed tags compare correctly new_version="${{ steps.set-tag.outputs.tag }}" new_version="${new_version#v}" new_major_minor=$(echo "$new_version" | cut -d. -f1,2) # Normalize all tags (strip v) before version-sorting, otherwise # git's v:refname sort ranks v-prefixed tags ahead of plain ones. 
latest_tag=$(git tag | sed 's/^v//' | sort -V | tail -n1 || echo "") if [[ -z "$latest_tag" ]]; then echo "No existing tags found — treating as new release" echo "is_major_minor=true" >> "$GITHUB_OUTPUT" else latest_major_minor=$(echo "$latest_tag" | cut -d. -f1,2) if [[ "$new_major_minor" != "$latest_major_minor" ]]; then echo "Major/minor version changed: $latest_major_minor -> $new_major_minor" echo "is_major_minor=true" >> "$GITHUB_OUTPUT" else echo "::notice::Only patch version changed ($latest_tag -> $new_version) — skipping release" echo "is_major_minor=false" >> "$GITHUB_OUTPUT" fi fi - name: Create new tag if: steps.check-tag.outputs.exists == 'false' && steps.check-version-change.outputs.is_major_minor == 'true' id: tag-version uses: mathieudutour/github-tag-action@v6.2 with: default_bump: false default_prerelease_bump: false github_token: ${{ secrets.GITHUB_TOKEN }} custom_tag: ${{ steps.set-tag.outputs.tag }} commit_sha: ${{ steps.determine-commit.outputs.commit }} tag_prefix: "" - name: Create a GitHub release if: steps.check-tag.outputs.exists == 'false' && steps.check-version-change.outputs.is_major_minor == 'true' uses: ncipollo/release-action@v1 with: tag: ${{ steps.set-tag.outputs.tag }} name: Release ${{ steps.set-tag.outputs.tag }} generateReleaseNotes: true ================================================ FILE: .gitignore ================================================ **/.Rhistory **/.DS_Store **/.Rapp.history **/.ipynb_checkpoints **/.virtual_documents susieR.Rproj .Rproj.user .RData .Ruserdata .pixi/ Rplots.pdf docs pixi.lock **/*.html **/*.so **/*.o susieR.Rcheck **/.*.swp **/.*.swo ================================================ FILE: DESCRIPTION ================================================ Encoding: UTF-8 Type: Package Package: susieR Title: Sum of Single Effects Linear Regression Description: Implements methods for variable selection in linear regression based on the "Sum of Single Effects" (SuSiE) model, as described in Wang et al 
(2020) and Zou et al (2021). These methods provide simple summaries, called "Credible Sets", for accurately quantifying uncertainty in which variables should be selected. The methods are motivated by genetic fine-mapping applications, and are particularly well-suited to settings where variables are highly correlated and detectable effects are sparse. The fitting algorithm, a Bayesian analogue of stepwise selection methods called "Iterative Bayesian Stepwise Selection" (IBSS), is simple and fast, allowing the SuSiE model to be fit to large data sets (thousands of samples and hundreds of thousands of variables). Date: 2026-04-24 Version: 0.16.1 Authors@R: c(person("Gao","Wang",role="aut",email="wang.gao@columbia.edu"), person("Yuxin","Zou",role="aut"), person("Alexander","McCreight",role="aut"), person("Kaiqian","Zhang",role="aut"), person("William","R.P. Denault",role="aut"), person("Peter","Carbonetto",role=c("aut","cre"), email="peter.carbonetto@gmail.com"), person("Matthew","Stephens",role="aut")) URL: https://github.com/stephenslab/susieR BugReports: https://github.com/stephenslab/susieR/issues License: BSD_3_clause + file LICENSE Depends: R (>= 3.0.2) Imports: methods, graphics, grDevices, stats, Matrix, matrixStats, mixsqp, reshape, crayon, ggplot2 LinkingTo: cpp11, cpp11armadillo Suggests: curl, pkgload, rprojroot, testthat, microbenchmark, knitr, rmarkdown, Rfast, cowplot, L0Learn LazyData: yes LazyDataCompression: xz NeedsCompilation: yes RoxygenNote: 7.3.3 VignetteBuilder: knitr ================================================ FILE: LICENSE ================================================ YEAR: 2017-2022 COPYRIGHT HOLDER: Gao Wang, Peter Carbonetto, Yuxin Zou, Kaiqian Zhang, Matthew Stephens ORGANIZATION: Gao Wang, Peter Carbonetto, Yuxin Zou, Kaiqian Zhang, Matthew Stephens ================================================ FILE: LICENSE.md ================================================ Copyright (c) 2017-2022, Gao Wang, Peter Carbonetto, Yuxin Zou, Kaiqian
Zhang, Matthew Stephens. All rights reserved. Redistribution and use in source and binary forms, with or without modification, are permitted provided that the following conditions are met: * Redistributions of source code must retain the above copyright notice, this list of conditions and the following disclaimer. * Redistributions in binary form must reproduce the above copyright notice, this list of conditions and the following disclaimer in the documentation and/or other materials provided with the distribution. * Neither the name of Gao Wang, Peter Carbonetto, Yuxin Zou, Kaiqian Zhang, Matthew Stephens, nor the names of its contributors may be used to endorse or promote products derived from this software without specific prior written permission. THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. ================================================ FILE: Makefile ================================================ # Makefile for susieR package .PHONY: all install document test test-coverage pkgdown lint style clean deep-clean check check-cran # Default target all: document install ## Install the package install: document @echo "Installing package..." 
@Rscript -e "devtools::install('.', quiet = TRUE, upgrade = FALSE, build = FALSE)" ## Document the package (properly handling Rcpp compilation) document: @echo "Ensuring DESCRIPTION has final newline..." @Rscript -e "lines <- readLines('DESCRIPTION'); writeLines(lines, 'DESCRIPTION')" @echo "Creating minimal NAMESPACE if missing..." @test -f NAMESPACE || ( echo "# Generated by roxygen2: do not edit by hand" > NAMESPACE && \ echo "" >> NAMESPACE ) @echo "Regenerating Rcpp exports..." @Rscript -e "Rcpp::compileAttributes('.')" @echo "Compiling shared library..." @Rscript -e "pkgbuild::compile_dll('.')" @echo "Documenting with roxygen2..." @Rscript -e "roxygen2::roxygenise('.', clean = TRUE)" ## Run tests test: @echo "Running tests..." @Rscript -e "devtools::test('.')" ## Test with coverage test-coverage: @echo "Running tests with coverage..." @Rscript -e "covr::package_coverage('.')" ## Build pkgdown site pkgdown: document @echo "Building pkgdown site..." @Rscript -e "pkgdown::clean_site('.')" @Rscript -e "pkgdown::init_site('.')" @Rscript -e "pkgdown::build_site('.', lazy = FALSE)" pkgdown-lazy: document @echo "Building pkgdown site (lazy mode - only changed pages)..." @Rscript -e "pkgdown::build_site('.', lazy = TRUE)" ## Run lintr lint: @echo "Running lintr..." @Rscript -e "lintr::lint_package('.')" ## Format code with styler style: @echo "Styling code..." @Rscript -e "styler::style_pkg('.')" ## Basic check check: document @echo "Running basic checks..." @Rscript -e "devtools::check('.', document = FALSE)" ## Run CRAN check check-cran: document @echo "Running CRAN checks..." @Rscript -e "devtools::check('.', cran = TRUE, document = FALSE)" ## Clean generated files (KEEP NAMESPACE to avoid issues) clean: @echo "Cleaning generated files..." 
@rm -f src/*.o src/*.so src/*.dll @rm -f src/RcppExports.cpp R/RcppExports.R @rm -rf man @rm -f src/symbols.rds @rm -rf *.tar.gz *.Rcheck @echo "Clean complete (NAMESPACE preserved)" ## Deep clean (removes everything including NAMESPACE) deep-clean: @echo "Deep cleaning all generated files..." @rm -f src/*.o src/*.so src/*.dll @rm -f src/RcppExports.cpp R/RcppExports.R @rm -rf man @rm -f NAMESPACE @rm -f src/symbols.rds @rm -rf *.tar.gz *.Rcheck @rm -rf .Rhistory .RData .Rproj.user @rm -rf docs @rm -rf inst/doc vignettes/*.html vignettes/*.R @echo "Deep clean complete" ## Quick development workflow (when NAMESPACE exists) quick: @echo "Quick rebuild (assumes NAMESPACE exists)..." @Rscript -e "Rcpp::compileAttributes('.')" @Rscript -e "devtools::install('.', quick = TRUE, upgrade = FALSE)" ## Load package for interactive use load: @echo "Loading package..." @Rscript -e "devtools::load_all('.')" ## Help help: @echo "susieR Makefile" @echo "" @echo "Main targets:" @echo " make - Document and install (default)" @echo " make document - Generate documentation (creates NAMESPACE if needed)" @echo " make install - Install package" @echo " make test - Run tests" @echo " make test-coverage - Test coverage report" @echo " make pkgdown - Build pkgdown site" @echo " make lint - Run lintr" @echo " make style - Format code with styler" @echo " make check - Run R CMD check" @echo " make check-cran - Run CRAN check" @echo "" @echo "Maintenance:" @echo " make clean - Remove generated files (keeps NAMESPACE)" @echo " make deep-clean - Remove ALL generated files" @echo "" @echo "Quick targets:" @echo " make quick - Quick rebuild (when NAMESPACE exists)" @echo " make load - Load package for interactive use" ================================================ FILE: NAMESPACE ================================================ # Generated by roxygen2: do not edit by hand S3method(coef,mr.ash) S3method(coef,susie) S3method(get_objective,default) S3method(ibss_initialize,default) 
S3method(post_loglik_prior_hook,default) S3method(pre_loglik_prior_hook,default) S3method(predict,mr.ash) S3method(predict,susie) S3method(print,slot_prior) S3method(print,summary.susie) S3method(print,summary.susie_post_outcome_configuration) S3method(summary,susie) S3method(summary,susie_post_outcome_configuration) export(absolute.order) export(block_coordinate_ascent) export(calc_z) export(coef.mr.ash) export(coef.susie) export(compute_marginal_bhat_shat) export(compute_suff_stat) export(estimate_s_rss) export(get.full.posterior) export(get_cs_correlation) export(get_objective) export(ibss_finalize) export(ibss_initialize) export(is_symmetric_matrix) export(kriging_rss) export(mr.ash) export(mr.ash.rss) export(path.order) export(post_loglik_prior_hook) export(pre_loglik_prior_hook) export(predict.mr.ash) export(predict.susie) export(print.summary.susie) export(print.summary.susie_post_outcome_configuration) export(slot_prior_betabinom) export(slot_prior_poisson) export(summary.susie) export(summary.susie_post_outcome_configuration) export(susie) export(susie_auto) export(susie_get_cs) export(susie_get_lfsr) export(susie_get_niter) export(susie_get_objective) export(susie_get_pip) export(susie_get_posterior_mean) export(susie_get_posterior_samples) export(susie_get_posterior_sd) export(susie_get_prior_variance) export(susie_get_residual_variance) export(susie_init_coef) export(susie_plot) export(susie_plot_changepoint) export(susie_plot_iteration) export(susie_post_outcome_configuration) export(susie_rss) export(susie_rss_lambda) export(susie_ss) export(susie_trendfilter) export(susie_workhorse) export(univar.order) export(univariate_regression) importFrom(Matrix,colMeans) importFrom(Matrix,colSums) importFrom(Matrix,crossprod) importFrom(Matrix,forceSymmetric) importFrom(Matrix,rowSums) importFrom(Matrix,sparseMatrix) importFrom(Matrix,summary) importFrom(Matrix,t) importFrom(Matrix,tcrossprod) importFrom(Rfast,colVars) importFrom(crayon,blue) 
importFrom(crayon,bold) importFrom(crayon,combine_styles) importFrom(crayon,cyan) importFrom(crayon,green) importFrom(crayon,has_color) importFrom(crayon,magenta) importFrom(crayon,silver) importFrom(crayon,yellow) importFrom(ggplot2,.data) importFrom(ggplot2,aes) importFrom(ggplot2,aes_string) importFrom(ggplot2,annotate) importFrom(ggplot2,geom_abline) importFrom(ggplot2,geom_col) importFrom(ggplot2,geom_line) importFrom(ggplot2,geom_point) importFrom(ggplot2,ggplot) importFrom(ggplot2,ggtitle) importFrom(ggplot2,labs) importFrom(ggplot2,theme_bw) importFrom(ggplot2,theme_classic) importFrom(grDevices,dev.off) importFrom(grDevices,pdf) importFrom(graphics,legend) importFrom(graphics,par) importFrom(graphics,plot) importFrom(graphics,points) importFrom(graphics,segments) importFrom(matrixStats,colSds) importFrom(methods,as) importFrom(mixsqp,mixsqp) importFrom(reshape,melt) importFrom(stats,.lm.fit) importFrom(stats,coef) importFrom(stats,cor) importFrom(stats,dnorm) importFrom(stats,lm) importFrom(stats,median) importFrom(stats,optim) importFrom(stats,optimize) importFrom(stats,pnorm) importFrom(stats,predict) importFrom(stats,rmultinom) importFrom(stats,rnorm) importFrom(stats,sd) importFrom(stats,summary.lm) importFrom(stats,var) importFrom(utils,head) importFrom(utils,modifyList) useDynLib(susieR, .registration = TRUE) ================================================ FILE: R/cpp11.R ================================================ # Generated by cpp11: do not edit by hand random_order <- function(p, numiter) { .Call(`_susieR_random_order`, p, numiter) } caisa_cpp <- function(X, w, sa2, pi_init, beta_init, r_init, sigma2, o_r, maxiter, miniter, convtol, epstol, method_q, updatepi, updatesigma, verbose) { .Call(`_susieR_caisa_cpp`, X, w, sa2, pi_init, beta_init, r_init, sigma2, o_r, maxiter, miniter, convtol, epstol, method_q, updatepi, updatesigma, verbose) } mr_ash_rss_cpp <- function(bhat, shat, z, R, var_y, n, sigma2_e, s0, w0, mu1_init, tol, max_iter, 
update_w0, update_sigma, compute_ELBO, standardize) { .Call(`_susieR_mr_ash_rss_cpp`, bhat, shat, z, R, var_y, n, sigma2_e, s0, w0, mu1_init, tol, max_iter, update_w0, update_sigma, compute_ELBO, standardize) } ================================================ FILE: R/diagnosis_reports.R ================================================ # Diagnostic functions for SuSiE-ash filter # # Per-iteration functions (called from susie_utils.R, return data.frame): # diagnose_bb_ash_iter() - BB+ash code path # diagnose_ash_filter_archived_iter() - V0 code path # # Post-run helpers (called via susieR:::): # collect_ash_diag(fit) - rbind all iterations into ML table # label_diag_truth(df, fit, causal) - add TP/FP labels # add_delta_features(df) - add per-slot change-over-iteration features # extract_bb_ash_features(fit, X, causal) - quick feature extraction from converged fit # compare_ash_methods(df1, df2) - side-by-side comparison # # Usage example: # fit <- susie(X, y, L=10, slot_prior=slot_prior_betabinom(), # unmappable_effects="ash", max_iter=50) # df <- susieR:::collect_ash_diag(fit) # df <- susieR:::label_diag_truth(df, fit, causal) # df <- susieR:::add_delta_features(df) # # # ML analysis: per-slot, per-iteration features with TP/FP labels # # Key columns: iter, slot, c_hat, lbf, purity, V, max_alpha, # # alpha_entropy, mask_tier, collision, ever_uncertain, ... # # Delta columns: delta_c_hat, delta_V, delta_lbf, delta_max_alpha, ... # # (change from previous iteration for the same slot) # # # # For 4-way comparison (BB+ash/V0 x mrash/no-mrash): # # options(susie.skip_mrash = TRUE) # toggle mr.ash off # # fit_nomrash <- susie(...) # # options(susie.skip_mrash = FALSE) # restore # # Data.frames accumulated on fit$.diag_env$history during the run. # Debug flag .ash_debug in susie_utils.R (TRUE = on, never turn off). 
#' BB+ash per-iteration diagnostic
#'
#' Builds one data.frame row per slot capturing the state of the BB+ash
#' code path at the current ash iteration (purity, c_hat decomposition,
#' masking tier, collision structure, rule activations, and the tunable
#' parameter values echoed for reproducibility).
#'
#' @return data.frame with one row per slot, all features
#' @keywords internal
diagnose_bb_ash_iter <- function(model, Xcorr, mask, b_confident,
                                 sentinels, sentinel_collision,
                                 is_confident_now, is_trusted,
                                 emerging_slots, active_slots, c_hat,
                                 ash_result, p,
                                 high_chat = NULL, low_chat = NULL,
                                 # Tunable parameters (captured for reproducibility)
                                 collision_threshold = 0.9,
                                 purity_threshold = 0.5,
                                 masking_threshold = 0.5,
                                 nPIP_threshold = 0.05,
                                 c_hat_excess_threshold = 0.2,
                                 alpha_entropy_threshold = log(5),
                                 slot_prior = NULL,
                                 mask_smoothness = NULL,
                                 mask_amount = NULL,
                                 mask_concentration = NULL,
                                 mask_burnin = NULL,
                                 mask_spread_pip_at_sent = NULL,
                                 mask_pip_prot_at_sent = NULL) {
  # NOTE(review): `emerging_slots` is accepted but never read in this
  # function body — confirm the caller contract before removing it.
  L <- nrow(model$alpha)
  theta_raw <- ash_result$beta
  theta_masked <- theta_raw
  theta_masked[mask] <- 0
  cs_coverage <- 0.9
  iter <- model$ash_iter
  rows <- list()
  for (l in seq_len(L)) {
    sent <- sentinels[l]
    alpha_l <- model$alpha[l, ]
    max_a <- max(alpha_l)
    # Purity and CS size
    cs_order <- order(alpha_l, decreasing = TRUE)
    cs_size <- min(which(cumsum(alpha_l[cs_order]) >= cs_coverage))
    if (cs_size > 1 && l %in% active_slots) {
      cs_idx <- cs_order[1:cs_size]
      pur <- min(abs(Xcorr[cs_idx, cs_idx]))
    } else if (cs_size == 1) {
      pur <- 1.0
    } else {
      pur <- 0.0
    }
    # Status
    status <- if (is_trusted[l]) "trusted" else
      if (is_confident_now[l] && model$ever_uncertain[l]) "conf_unc" else
        if (is_confident_now[l]) "confident" else
          if (sentinel_collision[l]) "collide" else
            if (model$V[l] == 0) "null" else "emerging"
    # Mask tier (key c_hat feature)
    mask_tier <- if (is_trusted[l]) "trusted" else
      if (!is.null(high_chat) && l %in% high_chat) "high_chat" else
        if (!is.null(low_chat) && l %in% low_chat) "low_chat" else "unknown"
    # Max cross-sentinel |r| (collision strength)
    max_cross_r <- 0
    if (sent > 0 && length(active_slots) > 1) {
      other_sents <- sentinels[setdiff(active_slots, l)]
      other_sents <- other_sents[other_sents > 0]
      if (length(other_sents) > 0) max_cross_r <-
          max(abs(Xcorr[sent, other_sents]))
    }
    # Sentinel change
    prev_sent_l <- if (!is.null(model$prev_sentinel)) model$prev_sentinel[l] else 0L
    sent_changed <- (prev_sent_l > 0) && (sent != prev_sent_l)
    # Theta at sentinel
    theta_at_sent <- if (sent > 0) theta_masked[sent] else 0
    theta_raw_at_sent <- if (sent > 0) theta_raw[sent] else 0
    # Alpha entropy (low = concentrated, possibly FP)
    alpha_nz <- alpha_l[alpha_l > 1e-10]
    alpha_entropy <- -sum(alpha_nz * log(alpha_nz))
    # Number of colliding partners
    n_colliding <- 0
    if (sent > 0 && length(active_slots) > 1) {
      other_sents <- sentinels[setdiff(active_slots, l)]
      other_sents <- other_sents[other_sents > 0]
      if (length(other_sents) > 0) n_colliding <-
          sum(abs(Xcorr[sent, other_sents]) > 0.9)
    }
    # Per-slot mu properties
    mu_l <- model$mu[l, ]
    mu_at_sent <- if (sent > 0) mu_l[sent] else 0
    max_abs_mu <- max(abs(mu_l))
    # c_hat relative to prior: how much evidence beyond the prior expectation
    # For BB: prior_log_odds = log(a + k_others) - log(b + L-1 - k_others)
    # c_hat_null = sigmoid(prior_log_odds), c_hat_excess = c_hat - c_hat_null
    # Prior params read from model$slot_prior (set during susie init)
    c_hat_null_l <- NA
    c_hat_excess_l <- NA
    if (!is.null(model$slot_weights) && !is.null(slot_prior) &&
        !is.null(slot_prior$a_beta)) {
      sw <- model$slot_weights
      k_others <- sum(sw[-l])
      prior_lo <- log(slot_prior$a_beta + k_others) -
        log(slot_prior$b_beta + L - 1 - k_others)
      c_hat_null_l <- 1 / (1 + exp(-prior_lo))
      c_hat_excess_l <- c_hat[l] - c_hat_null_l
    }
    rows[[l]] <- data.frame(
      method = "bb_ash",
      iter = iter,
      slot = l,
      sentinel = sent,
      purity = pur,
      V = model$V[l],
      c_hat = c_hat[l],
      c_hat_null = c_hat_null_l,
      c_hat_excess = c_hat_excess_l,
      lbf = if (!is.null(model$lbf)) model$lbf[l] else NA,
      max_alpha = max_a,
      cs_size = cs_size,
      alpha_entropy = alpha_entropy,
      is_confident = is_confident_now[l],
      is_trusted = is_trusted[l],
      status = status,
      mask_tier = mask_tier,
      was_low_chat = if (!is.null(model$was_low_chat)) model$was_low_chat[l] else FALSE,
      was_exposed = if (!is.null(model$was_exposed)) model$was_exposed[l] else FALSE,
      collision = sentinel_collision[l],
      ever_uncertain = model$ever_uncertain[l],
      n_colliding = n_colliding,
      max_cross_r = max_cross_r,
      sent_changed = sent_changed,
      prev_sentinel = prev_sent_l,
      mu_at_sent = mu_at_sent,
      max_abs_mu = max_abs_mu,
      theta_at_sent = theta_at_sent,
      theta_raw_at_sent = theta_raw_at_sent,
      mask_size = sum(mask),
      mask_frac = round(sum(mask) / p, 3),
      n_active = length(active_slots),
      n_trusted = sum(is_trusted),
      n_high_chat = if (!is.null(high_chat)) length(high_chat) else NA,
      n_low_chat = if (!is.null(low_chat)) length(low_chat) else NA,
      C_hat = round(sum(c_hat), 1),
      sigma2 = ash_result$sigma2,
      pi0 = if (!is.null(ash_result$pi)) ash_result$pi[1] else NA,
      theta_ss = sum(theta_masked^2),
      theta_raw_ss = sum(theta_raw^2),
      b_conf_ss = sum(b_confident^2),
      b_conf_max = max(abs(b_confident)),
      sent_masked = if (sent > 0) mask[sent] else FALSE,
      skip_mrash = getOption("susie.skip_mrash", FALSE),
      # Rule activation: which decision rules kicked in for this slot
      rule_active_gate = (l %in% active_slots),
      rule_collision = sentinel_collision[l],
      rule_jump = model$ever_uncertain[l] && !sentinel_collision[l],
      rule_trusted = is_trusted[l],
      rule_low_chat = if (!is.null(model$was_low_chat)) model$was_low_chat[l] else FALSE,
      rule_high_chat_pip = (!is.null(high_chat) && l %in% high_chat),
      rule_low_chat_sentinel = (!is.null(low_chat) && l %in% low_chat &&
        !(if (!is.null(model$was_exposed)) model$was_exposed[l] else FALSE)),
      rule_exposed = if (!is.null(model$was_exposed)) model$was_exposed[l] else FALSE,
      # Tunable parameter values
      param_collision_threshold = collision_threshold,
      param_purity_threshold = purity_threshold,
      param_masking_threshold = masking_threshold,
      param_nPIP_threshold = nPIP_threshold,
      param_c_hat_excess_threshold = c_hat_excess_threshold,
      param_alpha_entropy_threshold = alpha_entropy_threshold,
      # Unified mask diagnostics
      smoothness = if (!is.null(mask_smoothness)) mask_smoothness[l] else NA,
      amount = if (!is.null(mask_amount)) mask_amount[l] else NA,
      concentration = if (!is.null(mask_concentration)) mask_concentration[l] else NA,
      burnin = if (!is.null(mask_burnin)) mask_burnin[l] else NA,
      spread_pip_at_sent = if (!is.null(mask_spread_pip_at_sent) && sent > 0)
        mask_spread_pip_at_sent[l] else NA,
      pip_prot_at_sent = if (!is.null(mask_pip_prot_at_sent) && sent > 0)
        mask_pip_prot_at_sent[l] else NA,
      stringsAsFactors = FALSE
    )
  }
  do.call(rbind, rows)
}

#' V0 archived filter per-iteration diagnostic
#'
#' Same idea as diagnose_bb_ash_iter but for the archived V0 code path:
#' one data.frame row per slot with case/collision state and rule flags.
#'
#' @return data.frame with one row per slot, all features
#' @keywords internal
diagnose_ash_filter_archived_iter <- function(model, Xcorr, masked, b_confident,
                                              sentinels, effect_purity,
                                              current_case, current_collision,
                                              mrash_output) {
  L <- nrow(model$alpha)
  p <- ncol(model$alpha)
  theta_raw <- mrash_output$beta
  theta_masked <- theta_raw
  theta_masked[masked] <- 0
  cs_coverage <- 0.9
  iter <- model$ash_iter
  # A slot is "active" if its alpha vector is not flat.
  is_active <- sapply(seq_len(L), function(l) {
    max(model$alpha[l, ]) - min(model$alpha[l, ]) >= 5e-5
  })
  rows <- list()
  for (l in seq_len(L)) {
    sent <- sentinels[l]
    alpha_l <- model$alpha[l, ]
    max_a <- max(alpha_l)
    cs_order <- order(alpha_l, decreasing = TRUE)
    cs_size <- min(which(cumsum(alpha_l[cs_order]) >= cs_coverage))
    case_str <- if (!is.na(current_case[l])) paste0("C", current_case[l]) else "inactive"
    # Max cross-sentinel |r|
    max_cross_r <- 0
    active_idx <- which(is_active)
    if (sent > 0 && length(active_idx) > 1) {
      other_sents <- sentinels[setdiff(active_idx, l)]
      other_sents <- other_sents[other_sents > 0]
      if (length(other_sents) > 0) max_cross_r <-
          max(abs(Xcorr[sent, other_sents]))
    }
    # Sentinel change
    prev_sent_l <- if (!is.null(model$prev_sentinel)) model$prev_sentinel[l] else 0L
    sent_changed <- (prev_sent_l > 0) && (sent != prev_sent_l)
    # Theta at sentinel
    theta_at_sent <- if (sent > 0) theta_masked[sent] else 0
    theta_raw_at_sent <- if (sent > 0) theta_raw[sent] else 0
    # Alpha entropy
    alpha_nz <- alpha_l[alpha_l > 1e-10]
    alpha_entropy <- -sum(alpha_nz * log(alpha_nz))
    # Number of colliding partners
    n_colliding <- 0
    if (sent > 0 && length(active_idx) > 1) {
      other_sents <- sentinels[setdiff(active_idx, l)]
      other_sents <- other_sents[other_sents > 0]
      if (length(other_sents) > 0) n_colliding <-
          sum(abs(Xcorr[sent, other_sents]) > 0.9)
    }
    # Per-slot mu properties
    mu_l <- model$mu[l, ]
    mu_at_sent <- if (sent > 0) mu_l[sent] else 0
    max_abs_mu <- max(abs(mu_l))
    rows[[l]] <- data.frame(
      method = "v0",
      iter = iter,
      slot = l,
      sentinel = sent,
      purity = effect_purity[l],
      V = model$V[l],
      lbf = model$lbf[l],
      max_alpha = max_a,
      cs_size = cs_size,
      alpha_entropy = alpha_entropy,
      status = case_str,
      current_collision = current_collision[l],
      ever_diffuse = model$ever_diffuse[l],
      diffuse_iter_count = if (!is.null(model$diffuse_iter_count))
        model$diffuse_iter_count[l] else 0L,
      prev_case = if (!is.null(model$prev_case)) model$prev_case[l] else 0L,
      n_colliding = n_colliding,
      max_cross_r = max_cross_r,
      sent_changed = sent_changed,
      prev_sentinel = prev_sent_l,
      mu_at_sent = mu_at_sent,
      max_abs_mu = max_abs_mu,
      theta_at_sent = theta_at_sent,
      theta_raw_at_sent = theta_raw_at_sent,
      mask_size = sum(masked),
      mask_frac = round(sum(masked) / p, 3),
      n_active = sum(is_active),
      sigma2 = mrash_output$sigma2,
      pi0 = if (!is.null(mrash_output$pi)) mrash_output$pi[1] else NA,
      theta_ss = sum(theta_masked^2),
      theta_raw_ss = sum(theta_raw^2),
      b_conf_ss = sum(b_confident^2),
      b_conf_max = max(abs(b_confident)),
      sent_masked = if (sent > 0) masked[sent] else FALSE,
      skip_mrash = getOption("susie.skip_mrash", FALSE),
      # Rule activation: which V0 decision rules kicked in
      rule_collision = current_collision[l],
      rule_ever_diffuse = (model$ever_diffuse[l] > 0),
      rule_case1 = (!is.na(current_case[l]) && current_case[l] == 1),
      rule_case2 = (!is.na(current_case[l]) && current_case[l] == 2),
      rule_case3 = (!is.na(current_case[l]) && current_case[l] == 3),
      rule_exposure = (if (!is.null(model$diffuse_iter_count)) model$diffuse_iter_count[l] else
        0) >= 2,
      # NOTE(review): second_chance_used is indexed by `sent` (a variant
      # index) while the other fields index by slot — confirm intended.
      rule_second_chance = if (!is.null(model$second_chance_used))
        model$second_chance_used[sent] else FALSE,
      stringsAsFactors = FALSE
    )
  }
  do.call(rbind, rows)
}

# ---- Helper functions for ML analysis ----

#' Collect diagnostic data.frames across iterations
#'
#' Call this after running susie() to rbind all per-iteration diagnostics
#' into a single ML-ready data.frame.
#'
#' @param fit SuSiE fit object (must have been run with .ash_debug = TRUE)
#' @return data.frame with nrow = L * n_ash_iters, or NULL if no diagnostics
#'
#' @examples
#' \dontrun{
#' # Full ML pipeline:
#' data(unmappable_data)
#' X <- unmappable_data$X; y <- as.vector(unmappable_data$y)
#' causal <- which(unmappable_data$beta != 0)
#'
#' fit <- susie(X, y, L=10, slot_prior=slot_prior_betabinom(),
#'              unmappable_effects="ash", max_iter=50)
#'
#' df <- susieR:::collect_ash_diag(fit)             # all iterations
#' df <- susieR:::label_diag_truth(df, fit, causal) # TP/FP labels
#' df <- susieR:::add_delta_features(df)            # temporal features
#'
#' # Inspect FP slot across iterations:
#' subset(df, cs_label == "FP", select = c(iter, slot, sentinel,
#'   c_hat, lbf, max_alpha, alpha_entropy, mask_tier, delta_c_hat))
#'
#' # 4-way comparison (BB+ash vs V0, with/without mr.ash):
#' options(susie.skip_mrash = TRUE)
#' fit_nomrash <- susie(X, y, L=10, slot_prior=slot_prior_betabinom(),
#'                      unmappable_effects="ash", max_iter=50)
#' options(susie.skip_mrash = FALSE)
#' df_nomrash <- susieR:::collect_ash_diag(fit_nomrash)
#'
#' # Decision tree analysis:
#' # library(rpart)
#' # last_iter <- df[df$iter == max(df$iter) & df$V > 0, ]
#' # tree <- rpart(cs_label ~ c_hat + lbf + max_alpha + alpha_entropy +
#' #               purity + mask_tier + delta_c_hat, data = last_iter)
#' }
#'
#' @keywords internal
collect_ash_diag <- function(fit) {
  # Preferred storage: environment accumulated during the run.
  if (!is.null(fit$.diag_env) && !is.null(fit$.diag_env$history)) {
    return(do.call(rbind, fit$.diag_env$history))
  }
  # Fallback to old .diag_history list
  if (!is.null(fit$.diag_history)) {
return(do.call(rbind, fit$.diag_history)) } return(NULL) } #' Label diagnostic table with ground truth TP/FP #' #' For each slot at the final iteration, check if its CS (if any) contains #' a causal variant. #' #' @param df Diagnostic data.frame (from collect_ash_diag or single iter) #' @param fit SuSiE fit object #' @param causal Integer vector of causal variant indices #' @return df with added 'cs_label' column: "TP", "FP", or "-" (no CS) #' @keywords internal label_diag_truth <- function(df, fit, causal) { cs <- fit$sets$cs L <- max(df$slot) # Map each CS to its owning slot cs_slot_map <- rep(NA, L) cs_tp_map <- rep(NA, L) if (length(cs) > 0) { for (i in seq_along(cs)) { sent <- cs[[i]][which.max(fit$pip[cs[[i]]])] owner <- which.max(fit$alpha[, sent]) cs_slot_map[owner] <- i cs_tp_map[owner] <- any(cs[[i]] %in% causal) } } df$cs_label <- sapply(df$slot, function(l) { if (is.na(cs_slot_map[l])) "-" else if (cs_tp_map[l]) "TP" else "FP" }) df } #' Add per-slot delta features (change from previous iteration) #' #' Computes delta_c_hat, delta_V, delta_lbf, delta_max_alpha, #' delta_alpha_entropy, delta_purity for each slot across iterations. #' Also adds lag1 features (previous iteration values) and #' cumulative features (max c_hat ever, min alpha_entropy ever). #' These temporal features help ML models detect trajectories #' (e.g., a slot that was strong then weakened = collapse signal). #' #' @param df data.frame from collect_ash_diag + label_diag_truth #' @return df with added delta_, lag1_, and cum_ columns #' #' @examples #' \dontrun{ #' df <- susieR:::collect_ash_diag(fit) #' df <- susieR:::label_diag_truth(df, fit, causal) #' df <- susieR:::add_delta_features(df) #' # Now df has delta_c_hat, lag1_c_hat, cum_max_c_hat, etc. 
#' # Use for decision tree: rpart::rpart(cs_label ~ ., data = df_last_iter)
#' }
#'
#' @keywords internal
add_delta_features <- function(df) {
  # NOTE(review): rows within each slot are assumed to already be ordered
  # by iteration (deltas are taken in row order) — confirm upstream order.
  slots <- sort(unique(df$slot))
  # Features to compute deltas/lags for
  feat_cols <- c("c_hat", "V", "lbf", "max_alpha", "alpha_entropy",
                 "purity", "mask_size", "theta_ss")
  # Initialize new columns; slots with a single iteration keep NA.
  for (f in feat_cols) {
    df[[paste0("delta_", f)]] <- NA_real_
    df[[paste0("lag1_", f)]] <- NA_real_
  }
  df$cum_max_c_hat <- NA_real_
  df$cum_min_entropy <- NA_real_
  df$cum_max_lbf <- NA_real_
  for (s in slots) {
    idx <- which(df$slot == s)
    if (length(idx) < 2) next  # need >= 2 iterations for a delta
    slot_df <- df[idx, ]
    for (f in feat_cols) {
      vals <- slot_df[[f]]
      # all(is.na(NULL)) is TRUE, so columns absent from df are skipped too.
      if (all(is.na(vals))) next
      # Delta: current - previous; Lag1: previous value.
      df[[paste0("delta_", f)]][idx] <- c(NA, diff(vals))
      df[[paste0("lag1_", f)]][idx] <- c(NA, vals[-length(vals)])
    }
    # Cumulative features (NA replaced by the neutral element of the fold)
    if ("c_hat" %in% names(slot_df)) {
      df$cum_max_c_hat[idx] <-
        cummax(ifelse(is.na(slot_df$c_hat), 0, slot_df$c_hat))
    }
    if ("alpha_entropy" %in% names(slot_df)) {
      df$cum_min_entropy[idx] <-
        cummin(ifelse(is.na(slot_df$alpha_entropy), Inf, slot_df$alpha_entropy))
    }
    if ("lbf" %in% names(slot_df)) {
      df$cum_max_lbf[idx] <-
        cummax(ifelse(is.na(slot_df$lbf), 0, slot_df$lbf))
    }
  }
  df
}

#' Compare two diagnostic runs side by side
#'
#' Takes two data.frames (from diagnose_bb_ash_iter or
#' diagnose_ash_filter_archived_iter) at the same iteration
#' and prints a side-by-side comparison.
#'
#' @param df1 First diagnostic data.frame
#' @param df2 Second diagnostic data.frame
#' @param label1 Label for first run (e.g., "BB+ash")
#' @param label2 Label for second run (e.g., "V0")
#' @keywords internal
compare_ash_methods <- function(df1, df2, label1 = "Method1",
                                label2 = "Method2") {
  # Small local shorthand: formatted print.
  emit <- function(...) cat(sprintf(...))

  # Header and global (first-row) scalars.
  emit("\n===== %s vs %s (iter %d) =====\n", label1, label2, df1$iter[1])
  emit(" %-20s %12s %12s\n", "Feature", label1, label2)
  emit(" %s\n", strrep("-", 46))
  emit(" %-20s %12d %12d\n", "mask_size", df1$mask_size[1], df2$mask_size[1])
  emit(" %-20s %12d %12d\n", "n_active", df1$n_active[1], df2$n_active[1])
  emit(" %-20s %12.4f %12.4f\n", "sigma2", df1$sigma2[1], df2$sigma2[1])
  emit(" %-20s %12.2e %12.2e\n", "theta_ss", df1$theta_ss[1], df2$theta_ss[1])
  emit(" %-20s %12.2e %12.2e\n", "b_conf_ss", df1$b_conf_ss[1], df2$b_conf_ss[1])

  # Rows considered "active" under each method's own status vocabulary.
  active1 <- df1[df1$V > 0 | df1$status != "null", ]
  active2 <- df2[df2$V > 0 | df2$status != "inactive", ]

  emit("\n Per-slot:\n")
  emit(" %2s | %-5s %5s %6s %5s | %-5s %5s %6s %5s\n",
       "L", "Sent1", "Pur1", "V1", "Sta1", "Sent2", "Pur2", "V2", "Sta2")
  emit(" %s\n", strrep("-", 60))

  # One half of a per-slot line; dashes when the run has no such row.
  half <- function(row) {
    if (is.null(row))
      sprintf(" %5s %5s %6s %5s", "-", "-", "-", "-")
    else
      sprintf(" %5d %5.3f %6.4f %5s", row$sentinel, row$purity, row$V,
              substr(row$status, 1, 5))
  }

  for (i in seq_len(max(nrow(active1), nrow(active2)))) {
    r1 <- if (i <= nrow(active1)) active1[i, ] else NULL
    r2 <- if (i <= nrow(active2)) active2[i, ] else NULL
    slot_id <- if (!is.null(r1)) r1$slot else r2$slot
    cat(sprintf(" %2d |", slot_id))
    cat(half(r1), " |", sep = "")
    cat(half(r2))
    cat("\n")
  }
  emit("==========================================\n")
}

#' Extract ML feature table from a completed BB+ash fit
#'
#' Computes per-slot features from
the converged model. Call with
#' susieR:::extract_bb_ash_features(fit, X_or_Xcorr, causal).
#'
#' @param fit Completed susie fit (with slot_prior + ash)
#' @param X Design matrix (used to compute Xcorr if needed)
#' @param causal Integer vector of true causal indices (for labeling)
#' @return data.frame with one row per slot, all features + TP/FP label
#' @keywords internal
extract_bb_ash_features <- function(fit, X, causal = NULL) {
  L <- nrow(fit$alpha)
  p <- ncol(fit$alpha)
  # NOTE(review): `p` is not read anywhere in the visible body of this
  # function — confirm it is unused before removing.
  Xcorr <- cor(X)
  cs_coverage <- 0.9
  # Prefer fit$c_hat; fall back to slot_weights, then to a flat vector of 1s.
  c_hat <- if (!is.null(fit$c_hat)) fit$c_hat else
    if (!is.null(fit$slot_weights)) fit$slot_weights else rep(1, L)
  # Map CS to slots: a CS belongs to the slot whose alpha peaks at the
  # CS's highest-PIP member (its sentinel).
  cs <- fit$sets$cs
  cs_owner <- rep(NA, L)
  cs_is_tp <- rep(NA, L)
  if (length(cs) > 0) {
    for (i in seq_along(cs)) {
      sent <- cs[[i]][which.max(fit$pip[cs[[i]]])]
      owner <- which.max(fit$alpha[, sent])
      cs_owner[owner] <- i
      if (!is.null(causal)) cs_is_tp[owner] <- any(cs[[i]] %in% causal)
    }
  }
  rows <- list()
  for (l in seq_len(L)) {
    alpha_l <- fit$alpha[l, ]
    sent <- which.max(alpha_l)
    max_a <- max(alpha_l)
    # Purity: min |r| within the smallest set of variables covering 90%
    # of the slot's posterior mass; only meaningful when V[l] > 0.
    cs_order <- order(alpha_l, decreasing = TRUE)
    cs_size <- min(which(cumsum(alpha_l[cs_order]) >= cs_coverage))
    if (cs_size > 1 && fit$V[l] > 0) {
      cs_idx <- cs_order[1:cs_size]
      pur <- min(abs(Xcorr[cs_idx, cs_idx]))
    } else if (cs_size == 1) {
      pur <- 1.0
    } else {
      pur <- 0.0
    }
    # Alpha entropy (low = concentrated posterior)
    alpha_nz <- alpha_l[alpha_l > 1e-10]
    alpha_entropy <- -sum(alpha_nz * log(alpha_nz))
    # Max cross-sentinel |r| and number of colliding partners (|r| > 0.9)
    max_cross_r <- 0
    n_colliding <- 0
    active <- which(fit$V > 0)
    if (sent > 0 && length(active) > 1) {
      other_sents <- sapply(setdiff(active, l),
                            function(ll) which.max(fit$alpha[ll, ]))
      other_sents <- other_sents[other_sents > 0]
      if (length(other_sents) > 0) {
        cross_r <- abs(Xcorr[sent, other_sents])
        max_cross_r <- max(cross_r)
        n_colliding <- sum(cross_r > 0.9)
      }
    }
    # Theta at sentinel
    theta_at_sent <- if (!is.null(fit$theta) && sent > 0) fit$theta[sent] else 0
    # CS label
    cs_label <- if (is.na(cs_owner[l])) "-" else if (!is.null(causal) &&
      cs_is_tp[l]) "TP" else if (!is.null(causal)) "FP" else
        paste0("CS", cs_owner[l])
    rows[[l]] <- data.frame(
      slot = l,
      sentinel = sent,
      purity = pur,
      V = fit$V[l],
      c_hat = c_hat[l],
      lbf = if (!is.null(fit$lbf)) fit$lbf[l] else NA,
      max_alpha = max_a,
      cs_size = cs_size,
      alpha_entropy = alpha_entropy,
      max_cross_r = max_cross_r,
      n_colliding = n_colliding,
      theta_at_sent = theta_at_sent,
      n_active = length(active),
      cs_label = cs_label,
      stringsAsFactors = FALSE
    )
  }
  do.call(rbind, rows)
}


================================================
FILE: R/example_dataset.R
================================================
#' @name N2finemapping
#'
#' @title Simulated Fine-mapping Data with Two Effect Variables
#'
#' @docType data
#'
#' @description This data set contains a genotype matrix for 574
#' individuals and 1,002 variables. The variables are genotypes after
#' centering and scaling, and therefore retain the correlation
#' structure of the original genotype data. Two of the variables have
#' non-zero effects on the multivariate response. The response data
#' are generated under a multivariate linear regression model. See
#' Wang \emph{et al} (2020) for details.
#'
#' @format \code{N2finemapping} is a list with the following elements:
#'
#' \describe{
#'
#' \item{X}{Centered and scaled genotype data.}
#'
#' \item{chrom}{Chromosome of the original data, in hg38 coordinates.}
#'
#' \item{pos}{Chromosomal position of the original data, in hg38
#' coordinates.
The information can be used to compare impact of using
#' other genotype references of the same variables in \code{susie_rss}
#' application.}
#'
#' \item{true_coef}{Simulated effect sizes.}
#'
#' \item{residual_variance}{Simulated residual covariance matrix.}
#'
#' \item{Y}{Simulated multivariate response.}
#'
#' \item{allele_freq}{Allele frequencies based on the original
#' genotype data.}
#'
#' \item{V}{Suggested prior covariance matrix for effect sizes of
#' the two non-zero effect variables.}
#' }
#'
#' @keywords data
#'
#' @references
#' G. Wang, A. Sarkar, P. Carbonetto and M. Stephens (2020). A simple
#' new approach to variable selection in regression, with application
#' to genetic fine-mapping. \emph{Journal of the Royal Statistical
#' Society, Series B} \doi{10.1101/501114}.
#'
#' @examples
#' data(N2finemapping)
NULL

#' @name N3finemapping
#'
#' @title Simulated Fine-mapping Data with Three Effect Variables.
#'
#' @docType data
#'
#' @description The data-set contains a matrix of 574
#' individuals and 1,001 variables. These variables are real-world
#' genotypes centered and scaled, and therefore retain the
#' correlation structure of variables in the original genotype data.
#' Three of the variables have non-zero effects. The response data are
#' generated under a multivariate linear regression model. See Wang
#' \emph{et al} (2020) for more details.
#'
#' @format \code{N3finemapping} is a list with the following elements:
#'
#' \describe{
#'
#' \item{X}{N by P variable matrix of centered and scaled genotype
#' data.}
#'
#' \item{chrom}{Chromosome of the original data, in hg38 coordinates.}
#'
#' \item{pos}{Chromosomal position of the original data, in hg38
#' coordinates.
The information can be used to compare impact of using #' other genotype references of the same variables in susie_rss #' application.} #' #' \item{true_coef}{The simulated effect sizes.} #' #' \item{residual_variance}{The simulated residual covariance matrix.} #' #' \item{Y}{The simulated response variables.} #' #' \item{allele_freq}{Allele frequency of the original genotype data.} #' #' \item{V}{Prior covariance matrix for effect size of the three #' non-zero effect variables.} } #' #' @keywords data #' #' @references #' G. Wang, A. Sarkar, P. Carbonetto and M. Stephens (2020). A simple #' new approach to variable selection in regression, with application #' to genetic fine-mapping. \emph{Journal of the Royal Statistical #' Society, Series B} \doi{10.1101/501114}. #' #' @examples #' data(N3finemapping) NULL #' @name FinemappingConvergence #' #' @title Simulated Fine-mapping Data with Convergence Problem. #' #' @description Data simulated using real genotypes from 50,000 #' individuals and 200 SNPs. Two of the SNPs have non-zero effects #' on the multivariate response. The response data are generated under #' a linear regression model. The simulated response and the columns #' of the genotype matrix are centered. #' #' @format \code{FinemappingConvergence} is a list with the following #' elements: #' #' \describe{ #' #' \item{XtX}{Summary statistics computed using the centered and #' scaled genotype matrix.} #' #' \item{Xty}{Summary statistics computed using the centered and #' scaled genotype data, and the centered simulated response.} #' #' \item{yty}{yty is computed using the centered simulated response.} #' #' \item{n}{The sample size (50,000).} #' #' \item{true_coef}{The coefficients used to simulate the responses.} #' #' \item{z}{z-scores from a simple (single-SNP) linear regression.}} #' #' @docType data #' #' @keywords data #' #' @seealso A similar data set with more SNPs is used in the #' \dQuote{Refine SuSiE model} vignette. 
#'
#' @examples
#' data(FinemappingConvergence)
NULL

#' @name SummaryConsistency
#'
#' @title Simulated Fine-mapping Data with LD matrix From Reference Panel.
#'
#' @description Data simulated using real genotypes from 10,000
#' individuals and 200 SNPs. One SNP has a non-zero effect
#' on the multivariate response. The response data are generated under
#' a linear regression model. There is also one SNP with a flipped allele
#' between the summary statistics and the reference panel.
#'
#' @format \code{SummaryConsistency} is a list with the following
#' elements:
#'
#' \describe{
#'
#' \item{z}{z-scores computed by fitting univariate simple regression
#' variable-by-variable.}
#'
#' \item{ldref}{LD matrix estimated from the reference panel.}
#'
#' \item{flip_id}{The index of the SNP with the flipped allele.}
#'
#' \item{signal_id}{The index of the SNP with the non-zero effect.}}
#'
#' @seealso A similar data set with more samples is used in the
#' \dQuote{Diagnostic for fine-mapping with summary statistics}
#' vignette.
#'
#' @docType data
#'
#' @keywords data
#'
#' @examples
#' data(SummaryConsistency)
NULL

#' @name data_small
#'
#' @title Simulated Small-sample eQTL Data.
#'
#' @description A simulated eQTL data set with 47 individuals and 7,430
#' variables. The response is a simulated gene expression phenotype and
#' the variables are genotypes. This data set illustrates the small
#' sample-size setting considered in Denault \emph{et al} (2025).
#'
#' @format \code{data_small} is a list with the following elements:
#'
#' \describe{
#'
#' \item{y}{Simulated gene expression response.}
#'
#' \item{X}{Genotype matrix.}}
#'
#' @docType data
#'
#' @keywords data
#'
#' @seealso The \dQuote{Small data example} vignette.
#'
#' @references
#' W. R. P. Denault \emph{et al} (2025). Accounting for uncertainty in
#' residual variances improves fine-mapping in small sample studies.
#' \emph{bioRxiv} \doi{10.1101/2025.05.16.654543}.
#' #' @examples #' data(data_small) NULL #' @name unmappable_data #' #' @title Simulated Fine-mapping Data with Sparse, Oligogenic and Polygenic Effects. #' #' @description A simulated data set with 1,000 individuals and 5,000 #' variants, combining 3 sparse, 5 oligogenic and 15 polygenic #' non-zero effects. The response is generated under a linear #' regression model. This data set illustrates fine-mapping with #' SuSiE-ash and SuSiE-inf. #' #' @format \code{unmappable_data} is a list with the following elements: #' #' \describe{ #' #' \item{X}{Centered and scaled genotype matrix.} #' #' \item{y}{Simulated response.} #' #' \item{beta}{Simulated effect sizes.} #' #' \item{h2g}{Total proportion of variance in the response explained #' by the simulated effects.}} #' #' @docType data #' #' @keywords data #' #' @seealso The \dQuote{Fine-mapping with SuSiE-ash and SuSiE-inf} #' vignette. #' #' @examples #' data(unmappable_data) NULL ================================================ FILE: R/generic_methods.R ================================================ # ============================================================================= # DATA INITIALIZATION & CONFIGURATION # # S3 generics dispatched on data objects setup, configuration, and preprocessing. # These prepare data objects for model fitting and handle data-specific # configurations like unmappable effects. # # Functions: configure_data, get_var_y # ============================================================================= # Configure data object for specified method #' @keywords internal configure_data <- function(data, params) { UseMethod("configure_data") } #' @keywords internal configure_data.default <- function(data, params) { return(data) } # Get variance of y #' @keywords internal get_var_y <- function(data, ...) { UseMethod("get_var_y") } #' @keywords internal get_var_y.default <- function(data, ...) 
{ stop("get_var_y: no method for class '", class(data)[1], "'") } # ============================================================================= # MODEL INITIALIZATION & SETUP # # Functions for initializing model objects and setting up initial states. # These create model matrices, initialize fitted values, and prepare # the SuSiE model for iterative fitting. # # Functions: initialize_susie_model, initialize_fitted, validate_prior, track_ibss_fit # ============================================================================= # Initialize susie model object #' @keywords internal initialize_susie_model <- function(data, params, ...) { UseMethod("initialize_susie_model") } #' @keywords internal initialize_susie_model.default <- function(data, params, ...) { stop("initialize_susie_model: no method for class '", class(data)[1], "'") } # Initialize fitted values #' @keywords internal initialize_fitted <- function(data, mat_init) { UseMethod("initialize_fitted") } #' @keywords internal initialize_fitted.default <- function(data, mat_init, ...) { stop("initialize_fitted: no method for class '", class(data)[1], "'") } # Validate prior variance #' @keywords internal validate_prior <- function(data, params, model, ...) { UseMethod("validate_prior") } #' @keywords internal validate_prior.default <- function(data, params, model, ...) { invisible(TRUE) } # Track core parameters of a susie fit across iterations #' @keywords internal track_ibss_fit <- function(data, params, model, tracking, iter, ...) { UseMethod("track_ibss_fit") } #' @keywords internal track_ibss_fit.default <- function(data, params, model, tracking, iter, elbo, ...) { # Store iteration snapshot if tracking is enabled. # tracking is a purely numeric list: tracking[[1]], [[2]], etc. 
  if (isTRUE(params$track_fit)) {
    # Snapshot the core variational parameters at this iteration so the
    # fitting trajectory can be inspected after convergence.
    tracking[[iter]] <- list(
      alpha = model$alpha,
      niter = iter,
      V = model$V,
      sigma2 = model$sigma2
    )
    # Track slot activity per iteration when active (slot_weights is
    # only non-NULL when a slot prior is in use).
    if (!is.null(model$slot_weights)) {
      tracking[[iter]]$slot_weights <- model$slot_weights
      tracking[[iter]]$lbf <- model$lbf
    }
  }
  return(tracking)
}

# =============================================================================
# SINGLE EFFECT REGRESSION & ELBO
#
# Core functions for single effect regression computation and ELBO calculation.
# These handle the mathematical core of SuSiE including residual computation, SER
# statistics, posterior moments, and log-likelihood calculations for the ELBO.
#
# Functions: compute_residuals, compute_ser_statistics, SER_posterior_e_loglik,
#            calculate_posterior_moments, compute_kl, get_ER2, Eloglik, loglik,
#            neg_loglik
# =============================================================================

#' Get the slot weight for effect l
#'
#' Returns the weight by which effect l's contribution to the fitted
#' values is scaled. When \code{model$slot_weights} is NULL (the default),
#' all effects have weight 1 and standard SuSiE behavior is recovered.
#'
#' Slot weights enable a natural mechanism for adaptively estimating the
#' number of effects: each slot l can have a weight in [0,1] reflecting
#' the posterior probability that the slot is active. With a suitable
#' prior on the number of active effects, this generalizes SuSiE's fixed
#' L to a data-driven estimate.
#'
#' @param model SuSiE model object.
#' @param l Effect index.
#'
#' @return Scalar weight (default 1).
#'
#' @keywords internal
get_slot_weight <- function(model, l) {
  if (is.null(model$slot_weights)) 1 else model$slot_weights[l]
}

# Compute residuals for single effect regression. S3 generic dispatched
# on the class of `data` (individual, ss, rss_lambda, ...).
#' @keywords internal
compute_residuals <- function(data, params, model, l, ...) {
  UseMethod("compute_residuals")
}

# Default: there is no generic fallback; reaching this is a programming
# error (an unsupported data class).
#' @keywords internal
compute_residuals.default <- function(data, params, model, l, ...)
{ stop("compute_residuals: no method for class '", class(data)[1], "'") } # Compute SER statistics (betahat, shat2) #' @keywords internal compute_ser_statistics <- function(data, params, model, l, ...) { UseMethod("compute_ser_statistics") } #' @keywords internal compute_ser_statistics.default <- function(data, params, model, l, ...) { stop("compute_ser_statistics: no method for class '", class(data)[1], "'") } # Single effect regression posterior expected log-likelihood #' @keywords internal SER_posterior_e_loglik <- function(data, params, model, l) { UseMethod("SER_posterior_e_loglik") } #' @keywords internal SER_posterior_e_loglik.default <- function(data, params, model, l) { stop("SER_posterior_e_loglik: no method for class '", class(data)[1], "'") } # Calculate posterior moments for single effect regression #' @keywords internal calculate_posterior_moments <- function(data, params, model, V, l, ...) { UseMethod("calculate_posterior_moments") } #' @keywords internal calculate_posterior_moments.default <- function(data, params, model, V, l = NULL, ...) { stop("calculate_posterior_moments: no method for class '", class(data)[1], "'") } # Calculate KL divergence #' @keywords internal compute_kl <- function(data, params, model, l) { UseMethod("compute_kl") } #' @keywords internal compute_kl.default <- function(data, params, model, l) { model$KL[l] <- -model$lbf[l] + SER_posterior_e_loglik(data, params, model, l) return(model) } # Expected squared residuals #' @keywords internal get_ER2 <- function(data, model) { UseMethod("get_ER2") } #' @keywords internal get_ER2.default <- function(data, model) { stop("get_ER2: no method for class '", class(data)[1], "'") } # Expected log-likelihood #' @keywords internal Eloglik <- function(data, model) { UseMethod("Eloglik") } #' @keywords internal Eloglik.default <- function(data, model) { stop("Eloglik: no method for class '", class(data)[1], "'") } # Variational E_q[log p(y|b, sigma^2)] under SuSiE-NIG. 
# Non-S3 helper called
# from get_objective so we don't break the Eloglik(data, model) signature
# that downstream packages override (mvsusieR, mfsusieR).
# Decomposition: E_q[||y-Xb||^2 | sigma^2] = A + sigma^2 B,
#   B = sum_l sum_j alpha^(l)_j * r0^(l)_j * tau_j,
#   A = get_ER2 - E[sigma^2] * B.
# Eloglik = -n/2 log(2 pi) - n/2 (log b - digamma(a)) - 0.5 (A * a/b + B).
#' @keywords internal
nig_eloglik <- function(data, params, model)
{
  n <- data$n
  # Marginal expected residual sum of squares, E_q[||y - Xb||^2].
  ERSS_marg <- get_ER2(data, model)
  # Shape and rate of the inverse-gamma posterior on sigma^2.
  a_post <- (params$alpha0 + n) / 2
  b_post <- (params$beta0 + ERSS_marg) / 2
  # Per-variable inflation tau; defaults to 1 when not set on the model.
  tau_v <- if (!is.null(model$shat2_inflation)) model$shat2_inflation else 1
  pw <- model$predictor_weights
  # Accumulate B, the sigma^2-proportional part of the expected RSS,
  # over the L single effects (rows of alpha).
  B <- 0
  for (l in seq_len(nrow(model$alpha))) {
    # Shrinkage factor r0^(l)_j = V_l / (V_l + tau_j / w_j).
    r0_l <- model$V[l] / (model$V[l] + tau_v / pw)
    B <- B + sum(model$alpha[l, ] * r0_l * tau_v)
  }
  # A is the sigma^2-free part; b_post / (a_post - 1) is E[sigma^2]
  # under IG(a_post, b_post).
  A <- ERSS_marg - (b_post / (a_post - 1)) * B
  # Return E_q[log p(y | b, sigma^2)]; log(b_post) - digamma(a_post)
  # is E[log sigma^2] under the IG posterior.
  -n / 2 * log(2 * pi) - n / 2 * (log(b_post) - digamma(a_post)) -
    0.5 * (A * a_post / b_post + B)
}

# Log-likelihood and posterior moments for fixed mixture prior
# (estimate_prior_method = "fixed_mixture"). Evaluates BFs on a
# pre-specified variance grid with given mixture weights.
#' @keywords internal
loglik_mixture <- function(data, params, model, ser_stats, l, ...)
{
  UseMethod("loglik_mixture")
}

#' @keywords internal
loglik_mixture.default <- function(data, params, model, ser_stats, l, ...)
{
  # Shared implementation for all data types.
  # compute_ser_statistics() (type-specific) has already produced betahat
  # and shat2.
  model <- loglik_mixture_common(params, model, ser_stats, l)
  return(model)
}

# Posterior moments under the fixed mixture prior (S3 generic).
#' @keywords internal
calculate_posterior_moments_mixture <- function(data, params, model, l, ...)
{
  UseMethod("calculate_posterior_moments_mixture")
}

#' @keywords internal
calculate_posterior_moments_mixture.default <- function(data, params, model, l, ...)
{ # Shared implementation: mixture posterior from stored lbf_grid and ser_stats model <- calculate_posterior_moments_mixture_common(params, model, l) return(model) } # Log-likelihood for prior variance optimization #' @keywords internal loglik <- function(data, params, model, V, ser_stats, l = NULL, ...) { UseMethod("loglik") } #' @keywords internal loglik.default <- function(data, params, model, V, ser_stats, l = NULL, ...) { stop("loglik: no method for class '", class(data)[1], "'") } # Negative log-likelihood for optimization (handles both log and linear scales) #' @keywords internal neg_loglik <- function(data, params, model, V_param, ser_stats, ...) { UseMethod("neg_loglik") } #' @keywords internal neg_loglik.default <- function(data, params, model, V_param, ser_stats, ...) { stop("neg_loglik: no method for class '", class(data)[1], "'") } # EM update for prior variance #' @keywords internal em_update_prior_variance <- function(data, params, model, alpha, moments, V_init) { UseMethod("em_update_prior_variance") } #' @keywords internal em_update_prior_variance.default <- function(data, params, model, alpha, moments, V_init) { if (!is.null(params$use_NIG) && params$use_NIG) { nig_ss <- get_nig_sufficient_stats(data, model) return(update_prior_variance_NIG_EM(data$n, model$predictor_weights, model$residuals, nig_ss$yy, nig_ss$sxy, alpha, V_init, params$alpha0, params$beta0, nig_ss$tau)) } # Standard EM update sum(alpha * moments$post_mean2) } # ============================================================================= # MODEL UPDATES & FITTING # # Functions for iterative model updates and variance component estimation. # These handle the dynamic aspects of model fitting including fitted value # updates and variance component estimation. 
#
# Functions: update_fitted_values, update_variance_components, update_derived_quantities
# =============================================================================

# Update fitted values (S3 generic dispatched on the data class).
#' @keywords internal
update_fitted_values <- function(data, params, model, l, ...)
{
  UseMethod("update_fitted_values")
}

# Default: no generic fallback; every data class must supply a method.
#' @keywords internal
update_fitted_values.default <- function(data, params, model, l, ...)
{
  stop("update_fitted_values: no method for class '", class(data)[1], "'")
}

# Update variance components (S3 generic dispatched on the data class).
#' @keywords internal
update_variance_components <- function(data, params, model, ...)
{
  UseMethod("update_variance_components")
}

# Default residual-variance update, shared by all data classes unless
# overridden. Returns a list so methods can add further components.
#' @keywords internal
update_variance_components.default <- function(data, params, model, ...)
{
  if (isTRUE(params$use_NIG)) {
    # Posterior mean of IG((alpha0+n)/2, (beta0+ERSS)/2); the mean of
    # IG(a, b) is b/(a-1), which simplifies to the expression below.
    sigma2 <- (params$beta0 + get_ER2(data, model)) /
      (params$alpha0 + data$n - 2)
  } else {
    sigma2 <- est_residual_variance(data, model)
  }
  return(list(sigma2 = sigma2))
}

# Update derived quantities after variance component changes
#' @keywords internal
update_derived_quantities <- function(data, params, model)
{
  UseMethod("update_derived_quantities")
}

# Default is a no-op: most data classes have nothing derived from the
# variance components to refresh.
#' @keywords internal
update_derived_quantities.default <- function(data, params, model)
{
  return(model)
}

# =============================================================================
# OUTPUT GENERATION & POST-PROCESSING
#
# Functions for generating final results and summary statistics.
# These process fitted models into interpretable outputs including
# credible sets, variable names, and fitted values.
#
# Functions: get_scale_factors, get_intercept, get_fitted, get_cs,
#            get_variable_names, get_zscore, cleanup_model
# =============================================================================

# Get column scale factors (S3 generic dispatched on the data class).
#' @keywords internal
get_scale_factors <- function(data, params, ...)
{
  UseMethod("get_scale_factors")
}

#' @keywords internal
get_scale_factors.default <- function(data, params, ...)
{ stop("get_scale_factors: no method for class '", class(data)[1], "'") } # Get intercept #' @keywords internal get_intercept <- function(data, params, model, ...) { UseMethod("get_intercept") } #' @keywords internal get_intercept.default <- function(data, params, model, ...) { stop("get_intercept: no method for class '", class(data)[1], "'") } # Get fitted values #' @keywords internal get_fitted <- function(data, params, model, ...) { UseMethod("get_fitted") } #' @keywords internal get_fitted.default <- function(data, params, model, ...) { return(NULL) } # Get credible sets #' @keywords internal get_cs <- function(data, params, model, ...) { UseMethod("get_cs") } #' @keywords internal get_cs.default <- function(data, params, model, ...) { stop("get_cs: no method for class '", class(data)[1], "'") } # Get variable names #' @keywords internal get_variable_names <- function(data, model, ...) { UseMethod("get_variable_names") } #' @keywords internal get_variable_names.default <- function(data, model, ...) { stop("get_variable_names: no method for class '", class(data)[1], "'") } # Get univariate z-scores #' @keywords internal get_zscore <- function(data, params, model, ...) { UseMethod("get_zscore") } #' @keywords internal get_zscore.default <- function(data, params, model, ...) { return(NULL) } # Clean up model object by removing temporary computational fields #' @keywords internal cleanup_model <- function(data, params, model, ...) { UseMethod("cleanup_model") } #' Class-specific extra fields to strip in cleanup_model.default #' #' Default returns `character(0)`. Subclasses (e.g., mfsusieR's #' `raw_residuals`, mvsusieR's `Y_imputed`/`llik_cache`) override #' to add their per-class scratch fields. Result is unioned with #' the standard temp_fields list inside `cleanup_model.default`. 
#' @keywords internal cleanup_extra_fields <- function(data) { UseMethod("cleanup_extra_fields") } #' @keywords internal cleanup_extra_fields.default <- function(data) { character(0) } #' @keywords internal cleanup_model.default <- function(data, params, model, ...) { # Remove temporary fields common to all data types temp_fields <- c("null_weight", "predictor_weights", "runtime", "prev_elbo", "prev_alpha", "residuals", "fitted_without_l", "residual_variance", "shat2_inflation", cleanup_extra_fields(data)) for (field in temp_fields) { if (field %in% names(model)) { model[[field]] <- NULL } } return(model) } ================================================ FILE: R/individual_data_methods.R ================================================ # ============================================================================= # DATA INITIALIZATION & CONFIGURATION # # Functions for data object setup, configuration, and preprocessing. # These prepare data objects for model fitting and handle data-specific # configurations like unmappable effects. # # Functions: configure_data, get_var_y # ============================================================================= # Configure individual data for specified method #' @keywords internal configure_data.individual <- function(data, params) { if (params$unmappable_effects == "none" || params$unmappable_effects %in% c("ash", "ash_filter_archived")) { return(configure_data.default(data, params)) } else { # "inf" mode still requires sufficient statistics conversion warning_message("Individual-level data will be converted to sufficient statistics for unmappable effects methods (this step may take a while for a large data set)") return(convert_individual_to_ss(data, params)) } } # Get variance of y #' @keywords internal #' @importFrom stats var get_var_y.individual <- function(data, ...) 
{ return(var(drop(data$y))) } # ============================================================================= # MODEL INITIALIZATION & SETUP # # Functions for initializing model objects and setting up initial states. # These create model matrices, initialize fitted values, and prepare # the SuSiE model for iterative fitting. # # Functions: initialize_susie_model, initialize_fitted, validate_prior, track_ibss_fit # ============================================================================= # Initialize SuSiE model #' @keywords internal initialize_susie_model.individual <- function(data, params, var_y, ...) { # Base model model <- initialize_matrices(data, params, var_y) # Append predictor weights model$predictor_weights <- attr(data$X, "d") # Initialize NIG parameters if (params$use_NIG) { model$rv <- rep(1, params$L) model$marginal_loglik <- rep(as.numeric(NA), params$L) } # Initialize ash (Mr.ASH) tracking fields if (params$unmappable_effects == "ash") { model <- init_ash_fields(model, data$n, data$p, params$L, is_individual = TRUE) } else if (params$unmappable_effects == "ash_filter_archived") { model <- init_ash_fields_filter_archived(model, data$n, data$p, params$L, is_individual = TRUE) } return(model) } # Initialize fitted values #' @keywords internal initialize_fitted.individual <- function(data, mat_init) { return(list(Xr = compute_Xb(data$X, colSums(mat_init$alpha * mat_init$mu)))) } # Validate prior variance #' @keywords internal validate_prior.individual <- function(data, params, model, ...) { return(validate_prior.default(data, params, model, ...)) } # Track core parameters across iterations #' @keywords internal track_ibss_fit.individual <- function(data, params, model, tracking, iter, elbo, ...) { if (params$unmappable_effects %in% c("ash", "ash_filter_archived")) { tracking <- track_ibss_fit.default(data, params, model, tracking, iter, elbo, ...) 
    if (isTRUE(params$track_fit)) {
      # Also record the ash variance parameter trajectory per iteration.
      tracking[[iter]]$tau2 <- model$tau2
    }
    return(tracking)
  }
  # Non-ash modes: delegate entirely to the shared default tracker.
  return(track_ibss_fit.default(data, params, model, tracking, iter, elbo, ...))
}

# =============================================================================
# SINGLE EFFECT REGRESSION & ELBO
#
# Core functions for single effect regression computation and ELBO calculation.
# These handle the mathematical core of SuSiE including residual computation, SER
# statistics, posterior moments, and log-likelihood calculations for the ELBO.
#
# Functions: compute_residuals, compute_ser_statistics, SER_posterior_e_loglik,
#            calculate_posterior_moments, compute_kl, get_ER2, Eloglik, loglik,
#            neg_loglik
# =============================================================================

# Compute residuals for single effect regression
#' @keywords internal
compute_residuals.individual <- function(data, params, model, l, ...)
{
  # Remove lth effect from fitted values (scaled by slot weight)
  sw_l <- get_slot_weight(model, l)
  Xr_without_l <- model$Xr -
    sw_l * compute_Xb(data$X, model$alpha[l, ] * model$mu[l, ])

  # Compute residuals
  if (params$unmappable_effects %in% c("ash", "ash_filter_archived")) {
    # Subtract both sparse effects (without l) and ash theta
    R <- data$y - Xr_without_l - model$X_theta
  } else {
    R <- data$y - Xr_without_l
  }
  # X'R, the sufficient statistic the SER step works from.
  XtR <- compute_Xty(data$X, R)

  # Store unified residuals in model; downstream steps
  # (compute_ser_statistics, SER_posterior_e_loglik, update_fitted_values)
  # read these fields rather than recomputing them.
  model$residuals <- XtR
  model$fitted_without_l <- Xr_without_l
  model$raw_residuals <- R
  model$residual_variance <- model$sigma2 # Standard residual variance
  return(model)
}

# Compute SER statistics
#' @keywords internal
compute_ser_statistics.individual <- function(data, params, model, l, ...)
{
  # Per-variable least-squares estimate and its sampling variance:
  # betahat_j = (x_j'R) / w_j and shat2_j = sigma2 / w_j, where
  # w_j = model$predictor_weights (attr(X, "d"); presumably the column
  # sums of squares of X — TODO confirm against compute_colstats).
  betahat <- (1 / model$predictor_weights) * model$residuals
  shat2 <- model$residual_variance / model$predictor_weights

  # Optimization parameters for the prior-variance search: start from
  # the largest moment-based estimate max(betahat^2 - shat2, 1), on the
  # log scale, bounded to keep exp() well-behaved.
  optim_init <- log(max(c(betahat^2 - shat2, 1), na.rm = TRUE))
  optim_bounds <- c(-30, 15)
  optim_scale <- "log"

  return(list(
    betahat = betahat,
    shat2 = shat2,
    optim_init = optim_init,
    optim_bounds = optim_bounds,
    optim_scale = optim_scale
  ))
}

# Posterior expected log-likelihood for single effect regression
#' @keywords internal
SER_posterior_e_loglik.individual <- function(data, params, model, l)
{
  # First and second posterior moments of b for effect l.
  Eb <- model$alpha[l, ] * model$mu[l, ]
  Eb2 <- model$alpha[l, ] * model$mu2[l, ]
  # E_q[log p(R | X, b, sigma2)] expanded as
  # -n/2 log(2 pi sigma2)
  #   - (||R||^2 - 2 R'(X E[b]) + sum_j w_j E[b_j^2]) / (2 sigma2).
  return(-0.5 * data$n * log(2 * pi * model$sigma2) -
    0.5 / model$sigma2 *
      (sum(model$raw_residuals * model$raw_residuals) -
        2 * sum(model$raw_residuals * compute_Xb(data$X, Eb)) +
        sum(model$predictor_weights * Eb2)))
}

# Calculate posterior moments for single effect regression
#' @keywords internal
calculate_posterior_moments.individual <- function(data, params, model, V, l, ...)
{
  if (params$use_NIG) {
    if (V <= 0) {
      # Zero variance case: the prior collapses to a point mass at 0,
      # so both posterior moments are exactly zero.
      post_mean <- rep(0, data$p)
      post_mean2 <- rep(0, data$p)
      model$rv[l] <- 1
    } else {
      # Compute posterior moments for NIG prior
      nig_ss <- get_nig_sufficient_stats(data, model)
      moments <- compute_posterior_moments_NIG(data$n, model$predictor_weights,
        model$residuals, nig_ss$yy, nig_ss$sxy, V,
        params$alpha0, params$beta0, nig_ss$tau)
      post_mean <- moments$post_mean
      post_mean2 <- moments$post_mean2

      # Compute weighted average of residual variance modes using PIPs
      model$rv[l] <- sum(model$alpha[l, ] * moments$rv)
    }
  } else {
    # Standard Gaussian posterior calculations:
    # posterior precision = 1/V + w_j/sigma2, mean = s2_j * (x_j'R)/sigma2,
    # and E[b_j^2] = Var + mean^2.
    post_var <- (1 / V + model$predictor_weights / model$residual_variance)^(-1)
    post_mean <- (1 / model$residual_variance) * post_var * model$residuals
    post_mean2 <- post_var + post_mean^2
  }

  # Store posterior moments in model
  model$mu[l, ] <- post_mean
  model$mu2[l, ] <- post_mean2
  return(model)
}

# Calculate KL divergence
#' @keywords internal
compute_kl.individual <- function(data, params, model, l)
{
  if (params$use_NIG) {
    # NIG KL only valid for L=1 (gIBSS for L>1 has no coherent ELBO; supp.
    # line 503)
    if (params$L == 1) {
      ki <- nig_kl_inputs(data, params, model, l)
      kl <- compute_kl_NIG(model$alpha[l, ], model$mu[l, ], model$mu2[l, ],
        model$pi, model$V[l],
        a0 = params$alpha0 / 2, b0 = params$beta0 / 2,
        a_post = ki$a_post, b_post = ki$b_post,
        s_j_sq = ki$s_j_sq)
    } else {
      # L > 1 with NIG: no coherent ELBO, so the KL term is zeroed out.
      kl <- 0
    }
  } else {
    # Standard Gaussian KL divergence: KL = -loglik + E_q[loglik], where
    # loglik is reconstructed from the stored lbf plus the null loglik.
    loglik_term <- model$lbf[l] +
      sum(dnorm(model$raw_residuals, 0, sqrt(model$sigma2), log = TRUE))
    kl <- -loglik_term + SER_posterior_e_loglik(data, params, model, l)
  }

  # Store in model and return
  model$KL[l] <- kl
  return(model)
}

# Expected squared residuals
#' @keywords internal
get_ER2.individual <- function(data, model)
{
  # Xr_L holds the per-effect fitted values (one row per effect l).
  Xr_L <- compute_MXt(model$alpha * model$mu, data$X)
  postb2 <- model$alpha * model$mu2

  # For ash, subtract theta contribution from residuals
  y_adj <- if (!is.null(model$X_theta)) data$y - model$X_theta else data$y

  # Slot-weight correction: E[||y - sum_l c_l X beta^(l)||^2] under Bern(chat_l)
  # = ||y - Xr||^2 + sum_l chat_l * E[||X b^(l)||^2] - chat_l^2 * ||X bbar_l||^2
  # When slot_weights is NULL (all weights = 1), reduces to the standard formula.
  sw <- if (!is.null(model$slot_weights)) model$slot_weights else rep(1, nrow(model$alpha))
  per_slot_Eb2 <- as.vector(postb2 %*% model$predictor_weights) # L-vector
  per_slot_Xb2 <- rowSums(Xr_L^2) # L-vector
  return(sum((y_adj - model$Xr)^2) +
    sum(sw * per_slot_Eb2 - sw^2 * per_slot_Xb2))
}

# Expected log-likelihood
#' @keywords internal
Eloglik.individual <- function(data, model)
{
  # Gaussian expected log-likelihood given the expected squared residuals.
  return(-data$n / 2 * log(2 * pi * model$sigma2) -
    1 / (2 * model$sigma2) * get_ER2(data, model))
}

#' @importFrom Matrix colSums
#' @importFrom stats dnorm
#' @importFrom stats cor
#' @keywords internal
loglik.individual <- function(data, params, model, V, ser_stats, l = NULL, ...)
{ # Check if using NIG prior if (params$use_NIG) { # Compute log Bayes factors for NIG prior nig_ss <- get_nig_sufficient_stats(data, model) lbf <- compute_lbf_NIG(data$n, model$predictor_weights, model$residuals, nig_ss$yy, nig_ss$sxy, V, params$alpha0, params$beta0, nig_ss$tau) } else { # Standard Gaussian prior log Bayes factors lbf <- dnorm(ser_stats$betahat, 0, sqrt(V + ser_stats$shat2), log = TRUE) - dnorm(ser_stats$betahat, 0, sqrt(ser_stats$shat2), log = TRUE) } # Stabilize logged Bayes Factor stable_res <- lbf_stabilization(lbf, model$pi, ser_stats$shat2) # Compute posterior weights weights_res <- compute_posterior_weights(stable_res$lpo) # Store in model if l is provided, otherwise return lbf_model for prior variance optimization if (!is.null(l)) { # Store results in model model$alpha[l, ] <- weights_res$alpha model$lbf[l] <- weights_res$lbf_model model$lbf_variable[l, ] <- stable_res$lbf # Compute and store marginal log-likelihood for NIG prior if (params$use_NIG) { model$marginal_loglik[l] <- compute_marginal_loglik(weights_res$lbf_model, data$n, nig_ss$yy, params$alpha0, params$beta0, TRUE) } return(model) } else { return(weights_res$lbf_model) } } #' @keywords internal neg_loglik.individual <- function(data, params, model, V_param, ser_stats, ...) { # Convert parameter to V based on optimization scale (always log for individual) V <- exp(V_param) lbf_model <- loglik.individual(data, params, model, V, ser_stats) return(-lbf_model) } # ============================================================================= # MODEL UPDATES & FITTING # # Functions for iterative model updates and variance component estimation. # These handle the dynamic aspects of model fitting including fitted value # updates and variance component estimation. 
# # Functions: update_fitted_values, update_variance_components, update_derived_quantities # ============================================================================= # Update fitted values #' @keywords internal update_fitted_values.individual <- function(data, params, model, l, ...) { sw_l <- get_slot_weight(model, l) model$Xr <- model$fitted_without_l + sw_l * compute_Xb(data$X, model$alpha[l, ] * model$mu[l, ]) return(model) } # Update variance components for individual data #' @keywords internal update_variance_components.individual <- function(data, params, model, ...) { if (params$unmappable_effects == "ash_filter_archived") { # Original filter-based masking (archived for internal diagnostics) return(update_ash_variance_components_filter_archived(data, model, params)) } else if (params$unmappable_effects == "ash") { # c_hat + 3 LD-interference heuristics return(update_ash_variance_components(data, model, params)) } return(update_variance_components.default(data, params, model, ...)) } # Update derived quantities for individual data #' @keywords internal update_derived_quantities.individual <- function(data, params, model) { if (params$unmappable_effects %in% c("ash", "ash_filter_archived")) { # For ash, recompute full Xr including sparse effects only # (theta is tracked separately via X_theta) # Use slot_weights (c_hat) if available to maintain consistency # with the c_hat-weighted Xr from ibss_fit + update_c_hat. sw <- if (!is.null(model$slot_weights)) model$slot_weights else rep(1, nrow(model$alpha)) b <- colSums(sw * model$alpha * model$mu) model$Xr <- as.vector(compute_Xb(data$X, b)) return(model) } return(update_derived_quantities.default(data, params, model)) } # ============================================================================= # OUTPUT GENERATION & POST-PROCESSING # # Functions for generating final results and summary statistics. 
# These process fitted models into interpretable outputs including # credible sets, variable names, and fitted values. # # Functions: get_scale_factors, get_intercept, get_fitted, get_cs, # get_variable_names, get_zscore # ============================================================================= # Get column scale factors #' @keywords internal get_scale_factors.individual <- function(data, params) { return(attr(data$X, "scaled:scale")) } # Get intercept #' @keywords internal get_intercept.individual <- function(data, params, model, ...) { if (params$intercept) { return(data$mean_y - sum(attr(data$X, "scaled:center") * (colSums(model$alpha * model$mu) / attr(data$X, "scaled:scale")))) } else { return(0) } } # Get Fitted Values #' @keywords internal get_fitted.individual <- function(data, params, model, ...) { if (params$intercept) { fitted <- model$Xr + data$mean_y } else { fitted <- model$Xr } # Include ash theta contribution if (!is.null(model$X_theta)) { fitted <- fitted + model$X_theta } fitted <- drop(fitted) names(fitted) <- `if`(is.null(names(data$y)), rownames(data$X), names(data$y)) return(fitted) } # Get Credible Sets #' @keywords internal get_cs.individual <- function(data, params, model, ...) { if (is.null(params$coverage) || is.null(params$min_abs_corr)) { return(NULL) } return(susie_get_cs(model, X = data$X, coverage = params$coverage, min_abs_corr = params$min_abs_corr, n_purity = params$n_purity)) } # Get Variable Names #' @keywords internal get_variable_names.individual <- function(data, model, ...) { return(assign_names(data, model, colnames(data$X))) } # Get univariate z-score #' @keywords internal get_zscore.individual <- function(data, params, model, ...) 
{ if (isFALSE(params$compute_univariate_zscore)) { return(get_zscore.default(data, params, model)) } X <- data$X if (!is.matrix(X)) { warning_message( "Calculation of univariate regression z-scores is not ", "implemented specifically for sparse or trend filtering ", "matrices, so this step may be slow if the matrix is large; ", "to skip this step set compute_univariate_zscore = FALSE" ) } if (!is.null(model$null_weight) && model$null_weight != 0) { X <- X[, 1:(ncol(X) - 1)] } return(calc_z(X, data$y, center = params$intercept, scale = params$standardize)) } # Clean up model object for individual data #' @keywords internal cleanup_model.individual <- function(data, params, model, ...) { # Remove common fields model <- cleanup_model.default(data, params, model, ...) # Remove individual-specific temporary fields model$raw_residuals <- NULL # Remove NIG specific temporary fields if (params$use_NIG) { model$marginal_loglik <- NULL } # Remove ash-specific runtime fields if (!is.null(params$unmappable_effects) && params$unmappable_effects == "ash") { model <- cleanup_ash_fields(model) } else if (!is.null(params$unmappable_effects) && params$unmappable_effects == "ash_filter_archived") { model <- cleanup_ash_fields_filter_archived(model) } return(model) } ================================================ FILE: R/iterative_bayesian_stepwise_selection.R ================================================ # ============================================================================= # IBSS INITIALIZATION # # Initializes the SuSiE model object for Iterative Bayesian Stepwise Selection. # Sets up model matrices, handles model_init, and prepares for IBSS. # ============================================================================= #' Initialize IBSS model #' #' Creates and initializes the model object for the IBSS algorithm. 
#'
#' @param data Data object (individual, ss, or rss_lambda)
#' @param params Validated params object
#'
#' @return Initialized model object ready for the IBSS iteration loop.
#' @importFrom utils modifyList
#' @export
#' @keywords internal
ibss_initialize <- function(data, params) {
  UseMethod("ibss_initialize")
}

#' @rdname ibss_initialize
#' @export
#' @keywords internal
ibss_initialize.default <- function(data, params) {
  # Set var(y)
  var_y <- get_var_y(data)

  # Adjust number of single effects if needed: never request more
  # effects than there are variables.
  if (data$p < params$L) {
    params$L <- data$p
  }

  # Check & validate residual variance; default to var(y) when unset.
  if (is.null(params$residual_variance)) {
    params$residual_variance <- var_y
  }

  # For multivariate models, residual_variance can be a matrix;
  # otherwise it must be a positive numeric scalar.
  if (!is.matrix(params$residual_variance)) {
    if (!is.numeric(params$residual_variance)) {
      stop("Input residual variance sigma2 must be numeric.")
    }
    params$residual_variance <- as.numeric(params$residual_variance)
    if (length(params$residual_variance) != 1) {
      stop("Input residual variance sigma2 must be a scalar.")
    }
    if (params$residual_variance <= 0) {
      stop("Residual variance sigma2 must be positive (is your var(Y) zero?).")
    }
  }

  # Handle model initialization from a user-supplied fit (model_init):
  # validate it, prune zero-prior-variance effects, adjust L, then merge
  # it over a freshly-constructed model skeleton.
  if (!is.null(params$model_init)) {
    # Validate the contents of model_init
    validate_init(data, params)

    # Prune effects with zero prior variance
    model_init_pruned <- prune_single_effects(params$model_init)

    # Adjust the number of effects
    adjustment <- adjust_L(params, model_init_pruned, var_y)
    params$L <- adjustment$L

    # Create base model with all required fields
    mat_init <- initialize_susie_model(data, params, var_y)

    # Merge with adjusted model_init
    mat_init <- modifyList(mat_init, adjustment$model_init)

    # Reset iteration-specific values so stale KL/lbf from the supplied
    # fit do not leak into the new run.
    mat_init$KL <- rep(as.numeric(NA), params$L)
    mat_init$lbf <- rep(as.numeric(NA), params$L)
  } else {
    # Create fresh model
    mat_init <- initialize_susie_model(data, params, var_y)
  }

  # Initialize fitted values and null index
  fitted <- initialize_fitted(data, mat_init)
  null_index <- initialize_null_index(data, mat_init)

  # Preserve model class set by initialize_susie_model (e.g., "mvsusie")
  model_class <- class(mat_init)

  # Return assembled SuSiE object
  model <- c(mat_init, list(null_index = null_index), fitted)

  # Use the class from initialize_susie_model if it inherits from "susie",
  # otherwise default to "susie"
  if (inherits(mat_init, "susie")) {
    class(model) <- model_class
  } else {
    class(model) <- "susie"
  }
  model$converged <- FALSE

  # Initialize slot activity (c_hat) if specified.
  # c_hat[l] is the posterior probability that effect ("slot") l is
  # active; two prior families are supported (Beta-Binomial, Gamma-Poisson).
  sp <- params$slot_prior
  if (!is.null(sp)) {
    if (!is.slot_prior(sp))
      stop("slot_prior must be created by slot_prior_betabinom() or ",
           "slot_prior_poisson(). ",
           "Got class: ", paste(class(sp), collapse=", "))
    L <- nrow(model$alpha)
    if (inherits(sp, "slot_prior_betabinom")) {
      a_beta <- sp$a_beta
      b_beta <- sp$b_beta
      prior_mean <- a_beta / (a_beta + b_beta)
      # Use user-supplied c_hat_init only when its length matches L;
      # otherwise start all slots at the prior mean (capped below 1).
      if (!is.null(sp$c_hat_init) && length(sp$c_hat_init) == L) {
        c_hat <- sp$c_hat_init
      } else {
        c_hat <- rep(min(prior_mean, 1 - 1e-10), L)
      }
      model$slot_weights <- c_hat
      model$c_hat_state <- list(
        prior_type = "betabinom",
        a_beta = a_beta,
        b_beta = b_beta,
        update_schedule = sp$update_schedule,
        skip_threshold_multiplier = sp$skip_threshold_multiplier,
        skip_threshold = 0
      )
    } else {
      # Gamma-Poisson prior: C is the expected total number of active
      # slots, nu the concentration; (a_g, b_g) are the Gamma posterior
      # shape/rate over the activity intensity.
      C_val <- sp$C
      nu <- sp$nu
      if (!is.null(sp$c_hat_init) && length(sp$c_hat_init) == L) {
        c_hat <- sp$c_hat_init
        a_g <- nu + sum(c_hat)
      } else {
        c_hat <- rep(min(C_val / L, 1 - 1e-10), L)
        a_g <- nu + C_val
      }
      # max(C_val, 1e-6) guards against division by zero for C = 0.
      b_g <- nu / max(C_val, 1e-6) + 1
      model$slot_weights <- c_hat
      model$c_hat_state <- list(
        prior_type = "poisson",
        C = C_val,
        nu = nu,
        a_g = a_g,
        b_g = b_g,
        update_schedule = sp$update_schedule,
        skip_threshold_multiplier = sp$skip_threshold_multiplier,
        skip_threshold = 0
      )
    }
    # Fitted values must reflect the c_hat weighting from the start.
    model <- recompute_fitted_weighted(data, model)
  }

  # SS-path lambda_bias is stored as a scalar on the model. Only
  # allocate when R_mismatch is active so R_mismatch = "none" returns to the
  # un-augmented behavior (compute_shat2_inflation falls back to 0
  # when model$lambda_bias is NULL). The rss_lambda dispatch is out
  # of scope and continues to use a length-L vector.
  R_mismatch_mode <- if (!is.null(params$R_mismatch)) params$R_mismatch
    else "none"
  if (R_mismatch_mode != "none" && !is.null(data$R_finite_B) &&
      inherits(data, c("ss", "ss_mixture"))) {
    model$lambda_bias <- 0
    model$B_corrected <- data$R_finite_B
    model$R_finite_B <- data$R_finite_B
  }

  return(model)
}

# =============================================================================
# IBSS FITTING
#
# Updates all L single effects in the SuSiE model for one IBSS iteration.
# Calls single_effect_update for each effect and validates prior variance
# estimates.
# =============================================================================

#'
#' @param data Data object (individual, ss, or rss_lambda)
#' @param params Validated params object
#' @param model Current SuSiE model object
#'
#' @return Updated SuSiE model object with new alpha, mu, mu2, V, lbf, KL, and
#'   fitted values
#'
#' @keywords internal
#' @noRd
ibss_fit <- function(data, params, model) {
  L <- nrow(model$alpha)
  use_c_hat <- !is.null(model$c_hat_state)

  # SS / ss_mixture: lambda_bias / B_corrected are scalars set per-sweep
  # by fit_R_mismatch at the end of the sweep. rss_lambda does not carry
  # these (lambda > 0 + R_mismatch != "none" errors at entry). No reset
  # needed.
  if (L > 0) {
    for (l in seq_len(L)) {
      # Skip slots whose activity has dropped below the adaptive
      # threshold (cheap no-op for inactive effects).
      if (use_c_hat &&
          model$slot_weights[l] < model$c_hat_state$skip_threshold) {
        next
      }
      model <- single_effect_update(data, params, model, l)
      if (use_c_hat) {
        model <- update_c_hat(data, model, l)
      }
    }
  }

  # Gamma-Poisson batch shape update (once per sweep)
  if (use_c_hat && model$c_hat_state$update_schedule == "batch" &&
      model$c_hat_state$prior_type != "betabinom") {
    model$c_hat_state$a_g <- model$c_hat_state$nu + sum(model$slot_weights)
  }

  # Adaptive skip threshold: baseline c_hat with lbf=0, scaled by multiplier
  if (use_c_hat && model$c_hat_state$skip_threshold_multiplier > 0) {
    st <- model$c_hat_state
    L_val <- nrow(model$alpha)
    if (st$prior_type == "betabinom") {
      # Self-consistent baseline: one Newton step for
      # k_{-l} = k_total - baseline
      k_total <- sum(model$slot_weights)
      approx <- log(st$a_beta + k_total) -
        log(st$b_beta + L_val - 1 - k_total)
      k_others <- k_total - 1 / (1 + exp(-approx))
      baseline_logodds <- log(st$a_beta + k_others) -
        log(st$b_beta + L_val - 1 - k_others)
    } else {
      baseline_logodds <- digamma(st$a_g) - log(st$b_g) - log(L_val)
    }
    c_hat_baseline <- 1 / (1 + exp(-baseline_logodds))
    model$c_hat_state$skip_threshold <-
      st$skip_threshold_multiplier * c_hat_baseline
  }

  # Region-level R-bias fit at the end of the sweep, before validate.
  # No-op when R_mismatch = "none" or on the rss_lambda dispatch (out of
  # scope; that path keeps the legacy per-slot fit). Reuses the
  # existing estimate_lambda_bias optimizer; only the cadence and
  # storage shape change (was per-slot inside the SER step; now
  # scalar at sweep boundary).
  if (inherits(data, c("ss", "ss_mixture"))) {
    old_lambda_bias <- model$lambda_bias
    model <- fit_R_mismatch(data, params, model)
    new_lambda_bias <- model$lambda_bias
    # Record the change so check_convergence can hold off convergence
    # until a material lambda update has been consumed by a full sweep.
    if (!is.null(old_lambda_bias) || !is.null(new_lambda_bias)) {
      old <- if (is.null(old_lambda_bias)) 0 else old_lambda_bias
      new <- if (is.null(new_lambda_bias)) 0 else new_lambda_bias
      model$runtime$lambda_bias_diff <- max(abs(new - old))
    }
  }

  # Validate prior variance is reasonable
  validate_prior(data, params, model)

  return(model)
}

# =============================================================================
# SLOT ACTIVITY (c_hat) HELPERS
#
# c_hat[l] = posterior probability that slot l is active.
# Beta-Binomial: logit(c_l) = log(a + k_{-l}) - log(b + L-1 - k_{-l}) + lbf_l
# Gamma-Poisson: logit(c_l) = psi(a_g) - log(b_g) - log(L) + lbf_l
# =============================================================================

#' Update c_hat for slot l after its SER step.
#' @keywords internal
#' @noRd
update_c_hat <- function(data, model, l) {
  st <- model$c_hat_state
  old_c <- model$slot_weights[l]
  L <- nrow(model$alpha)
  lbf_l <- model$lbf[l]
  # An NA/non-finite Bayes factor contributes no evidence.
  if (is.na(lbf_l) || !is.finite(lbf_l)) lbf_l <- 0
  if (st$prior_type == "betabinom") {
    k_others <- sum(model$slot_weights[-l])
    log_odds <- log(st$a_beta + k_others) -
      log(st$b_beta + L - 1 - k_others) + lbf_l
  } else {
    log_odds <- digamma(st$a_g) - log(st$b_g) - log(L) + lbf_l
  }
  # Clamp to avoid overflow in the logistic transform.
  log_odds <- max(min(log_odds, 20), -20)
  new_c <- 1 / (1 + exp(-log_odds))
  model$slot_weights[l] <- new_c
  # Keep the cached fitted values consistent with the new weight.
  if (abs(new_c - old_c) > 1e-15) {
    b_bar_l <- model$alpha[l, ] * model$mu[l, ]
    model <- adjust_fitted_for_c_hat(data, model, b_bar_l, new_c - old_c)
  }
  # Gamma shape update (sequential mode; Beta-Binomial uses k_others directly)
  if (st$prior_type != "betabinom" && st$update_schedule == "sequential") {
    model$c_hat_state$a_g <- st$nu + sum(model$slot_weights)
  }
  return(model)
}

#' Add delta_weight * R*b_bar_l to the fitted-values field (Xr/XtXr/Rz).
#' @keywords internal
#' @noRd
adjust_fitted_for_c_hat <- function(data, model, b_bar_l, delta_weight) {
  target <- detect_fitted_field(model)
  if (target == "Xr") {
    # Individual-data path: fitted values live on the X scale.
    increment <- as.vector(compute_Xb(data$X, b_bar_l))
    model$Xr <- model$Xr + delta_weight * increment
  } else {
    # Summary-data paths (XtXr / Rz): fitted values live on the R scale.
    increment <- as.vector(compute_Rv(data, b_bar_l, model$X_meta))
    model[[target]] <- model[[target]] + delta_weight * increment
  }
  return(model)
}

#' Return the name of the fitted-values field carried by this model,
#' checking the summary-data fields before the individual-data one.
#' @keywords internal
#' @noRd
detect_fitted_field <- function(model) {
  for (candidate in c("Rz", "XtXr", "Xr")) {
    if (candidate %in% names(model)) {
      return(candidate)
    }
  }
  stop("Cannot detect fitted-values field on model object.")
}

#' Recompute fitted = sum_l c_hat[l] * R * bbar[l] from scratch.
#' @keywords internal
#' @noRd
recompute_fitted_weighted <- function(data, model) {
  target <- detect_fitted_field(model)
  # Scale row l of alpha * mu by slot_weights[l] (the weight vector
  # recycles down the rows of the L x p matrices), then collapse over
  # effects; summation order matches an explicit per-effect loop.
  b_weighted <- colSums(model$slot_weights * model$alpha * model$mu)
  if (target == "Xr") {
    model$Xr <- as.vector(compute_Xb(data$X, b_weighted))
  } else {
    model[[target]] <- as.vector(compute_Rv(data, b_weighted, model$X_meta))
  }
  return(model)
}

# =============================================================================
# IBSS FINALIZATION
#
# Finalizes the SuSiE model after convergence or maximum number of iterations
# reached. Computes credible sets, PIPs, intercept, fitted values, and z-scores.
# =============================================================================

#' Finalize IBSS model
#'
#' Computes credible sets, PIPs, z-scores, and cleans up temporary
#' fields from the model object.
#'
#' @param data Data object (individual, ss, or rss_lambda)
#' @param params Validated params object
#' @param model Converged model object
#' @param elbo ELBO values (optional)
#' @param iter Number of iterations completed
#' @param tracking Tracking data (optional)
#'
#' @return Finalized model object with credible sets and PIPs.
#' @export
#' @keywords internal
ibss_finalize <- function(data, params, model, elbo = NULL,
                          iter = NA_integer_, tracking = NULL) {
  # Record how many IBSS iterations were run.
  model$niter <- iter

  # Intercept & fitted values on the original data scale.
  model$X_column_scale_factors <- get_scale_factors(data, params)
  model$intercept <- get_intercept(data, params, model)
  model$fitted <- get_fitted(data, params, model)

  # Posterior summaries: credible sets, PIPs, univariate z-scores.
  model$sets <- get_cs(data, params, model)
  model$pip <- susie_get_pip(model, prior_tol = params$prior_tol)
  model$z <- get_zscore(data, params, model)

  # Keep the per-iteration trace only when the user asked for it.
  if (params$track_fit)
    model$trace <- tracking

  # Attach variable names to per-variable output fields.
  model <- get_variable_names(data, model)

  # R diagnostics (from data -> model, following sets/pip/z pattern).
  # SS / ss_mixture paths store lambda_bias / B_corrected as scalars
  # (set by fit_R_mismatch once per sweep). The rss_lambda dispatch keeps
  # the per-slot vector form. Copy whatever shape lives on the model.
  r_diag <- data$R_finite_diagnostics
  if (!is.null(r_diag)) {
    model$R_finite_diagnostics <- r_diag
    if (!is.null(model$lambda_bias))
      model$R_finite_diagnostics$lambda_bias <- model$lambda_bias
    if (!is.null(model$B_corrected))
      model$R_finite_diagnostics$B_corrected <- model$B_corrected
    if (!is.null(data$R_mismatch))
      model$R_finite_diagnostics$R_mismatch <- data$R_mismatch
    if (!is.null(model$shat2_inflation))
      model$R_finite_diagnostics$per_variable_penalty <-
        as.vector(model$shat2_inflation - 1)
    # Q_art / artifact fields are present only for R_mismatch = "map_qc"
    # (set by fit_R_mismatch). Copy whichever exist.
    qc_fields <- c("Q_art", "artifact_flag", "artifact_evaluable",
                   "low_eigen_count", "low_eigen_fraction", "eig_delta",
                   "mode_label")
    for (fld in qc_fields) {
      if (!is.null(model[[fld]]))
        model$R_finite_diagnostics[[fld]] <- model[[fld]]
    }
  }

  # Multi-panel omega weights
  if (!is.null(model$omega))
    model$omega_weights <- model$omega

  # Store Gamma-Poisson c_hat results on output for user access
  # and for susieAnn to extract (a_g, b_g needed for genome-wide nu update).
  st <- model$c_hat_state
  if (!is.null(st)) {
    model$c_hat <- model$slot_weights
    model$C_hat <- sum(model$slot_weights)
    if (st$prior_type == "betabinom") {
      model$a_beta <- st$a_beta
      model$b_beta <- st$b_beta
    } else {
      model$a_g <- st$a_g
      model$b_g <- st$b_g
    }
    model$c_hat_state <- NULL # cleanup internal state
  }

  # Clean up temporary computational fields
  model <- cleanup_model(data, params, model)

  return(model)
}



================================================
FILE: R/mixture_prior.R
================================================
# =============================================================================
# FIXED MIXTURE PRIOR
#
# Shared implementations for estimate_prior_method = "fixed_mixture".
# Evaluates Bayes factors on a pre-specified variance grid with given mixture
# weights, computes mixture posterior moments, and stores per-grid BF matrix.
#
# These functions are data-type-agnostic: they operate on betahat and shat2
# produced by the type-specific compute_ser_statistics().
# =============================================================================

#' Resolve fixed mixture prior parameters
#'
#' Called from susie, susie_ss, and susie_rss to handle the
#' prior_variance_grid / mixture_weights parameters. When
#' prior_variance_grid is non-NULL, overrides estimate_prior_method
#' to "fixed_mixture" and validates inputs. Returns a list with
#' the resolved estimate_prior_method, estimate_prior_variance,
#' prior_variance_grid, and mixture_weights.
#'
#' @keywords internal
resolve_mixture_prior <- function(estimate_prior_method,
                                  estimate_prior_variance,
                                  prior_variance_grid,
                                  mixture_weights) {
  if (is.null(prior_variance_grid)) {
    # No grid: simply validate the scalar-prior method choice and
    # pass the remaining arguments through unchanged.
    estimate_prior_method <- match.arg(
      estimate_prior_method,
      c("optim", "EM", "simple")
    )
  } else {
    # A grid was supplied: default to uniform weights, validate the
    # grid/weights pair, and force the fixed-mixture code path.
    K <- length(prior_variance_grid)
    if (is.null(mixture_weights))
      mixture_weights <- rep(1 / K, K)
    stopifnot(
      length(mixture_weights) == K,
      all(prior_variance_grid > 0),
      all(mixture_weights >= 0),
      abs(sum(mixture_weights) - 1) < 1e-8
    )
    estimate_prior_method <- "fixed_mixture"
    estimate_prior_variance <- FALSE
  }
  list(
    estimate_prior_method = estimate_prior_method,
    estimate_prior_variance = estimate_prior_variance,
    prior_variance_grid = prior_variance_grid,
    mixture_weights = mixture_weights
  )
}

#' Compute mixture log-Bayes factors and posterior inclusion probabilities
#'
#' For each grid point k and variant j, computes the Wakefield approximate
#' Bayes factor (ABF), then forms the mixture BF as a weighted sum over grid
#' points. Stores the full p x K log-BF matrix in model$lbf_grid[[l]] for
#' downstream use (e.g., mixsqp M-step in susieAnn).
#'
#' @param params Params object with prior_variance_grid (K-vector) and
#'   mixture_weights (K-vector summing to 1)
#' @param model Current model object with pi (prior weights)
#' @param ser_stats List with betahat (p-vector) and shat2 (p-vector)
#' @param l Effect index
#'
#' @return Updated model with alpha[l,], lbf[l], lbf_variable[l,], lbf_grid[[l]]
#'
#' @keywords internal
loglik_mixture_common <- function(params, model, ser_stats, l) {
  grid <- params$prior_variance_grid  # K-vector
  w <- params$mixture_weights         # K-vector
  K <- length(grid)
  betahat <- ser_stats$betahat        # p-vector
  shat2 <- ser_stats$shat2            # p-vector (may contain Inf)
  p <- length(betahat)

  # Compute p x K matrix of log-BFs (Wakefield ABF at each grid point)
  # Uses pmax only for the ABF computation to avoid log(0), matching the
  # scalar path which applies pmax inside loglik.rss_lambda
  shat2_safe <- pmax(shat2, .Machine$double.eps)
  lbf_grid <- matrix(0, nrow = p, ncol = K)
  for (k in seq_len(K)) {
    V_k <- grid[k]
    lbf_grid[, k] <- -0.5 * log(1 + V_k / shat2_safe) +
      0.5 * betahat^2 * V_k / (shat2_safe * (V_k + shat2_safe))
  }

  # Mixture log-BF per variant: log(sum_k w_k * exp(lbf_jk)), computed
  # with the log-sum-exp trick for numerical stability.
  # For K=1 this reduces to lbf_grid[,1] exactly (no numerical error)
  if (K == 1L) {
    lbf_mix <- lbf_grid[, 1]
  } else {
    log_w <- log(w)
    lbf_mix <- apply(lbf_grid, 1, function(row) {
      shifted <- row + log_w
      max_val <- max(shifted)
      max_val + log(sum(exp(shifted - max_val)))
    })
  }

  # Store per-grid BF matrix for M-step (e.g., mixsqp in susieAnn)
  if (is.null(model$lbf_grid)) {
    model$lbf_grid <- vector("list", nrow(model$alpha))
  }
  model$lbf_grid[[l]] <- lbf_grid

  # Cache ser_stats for calculate_posterior_moments_mixture_common
  # (cleared there after use).
  model$.ser_stats <- ser_stats

  # Compute posterior inclusion probabilities using existing machinery.
  # Pass raw shat2 (not pmax'd) to lbf_stabilization, matching the scalar
  # path.
  stable_res <- lbf_stabilization(lbf_mix, model$pi, shat2)
  weights_res <- compute_posterior_weights(stable_res$lpo)
  model$alpha[l, ] <- weights_res$alpha
  model$lbf[l] <- weights_res$lbf_model
  model$lbf_variable[l, ] <- stable_res$lbf
  return(model)
}

#' Compute mixture posterior moments
#'
#' For each grid point k, computes the conjugate normal posterior moments
#' (mean, variance) given prior variance V_k. Forms the mixture posterior
#' using responsibility weights r_jk = w_k * BF_jk / sum_k' w_k' * BF_jk'.
#'
#' Uses betahat and shat2 from ser_stats (produced by the data-type-specific
#' compute_ser_statistics), so this function is data-type-agnostic.
#'
#' @param params Params object with prior_variance_grid and mixture_weights
#' @param model Model with lbf_grid[[l]] (p x K), alpha[l,] already computed,
#'   and ser_stats cached from loglik_mixture_common
#' @param l Effect index
#'
#' @return Updated model with mu[l,] and mu2[l,]
#'
#' @keywords internal
calculate_posterior_moments_mixture_common <- function(params, model, l) {
  grid <- params$prior_variance_grid
  w <- params$mixture_weights
  K <- length(grid)
  lbf_grid <- model$lbf_grid[[l]]        # p x K
  betahat <- model$.ser_stats$betahat    # cached by loglik_mixture_common
  shat2 <- model$.ser_stats$shat2
  shat2_safe <- pmax(shat2, .Machine$double.eps)
  p <- length(betahat)

  # Responsibility weights: r_jk = w_k * BF_jk / sum_k' w_k' * BF_jk'
  # Work in log space for stability
  log_w <- log(w + .Machine$double.eps)
  log_r <- sweep(lbf_grid, 2, log_w, "+")  # p x K
  # Subtracting the per-row max (recycled down the rows) keeps exp() in
  # range before normalizing each row to sum to 1.
  log_r_max <- apply(log_r, 1, max)
  r <- exp(log_r - log_r_max)  # p x K, shifted
  r <- r / rowSums(r)          # normalize to responsibilities

  # Per-grid posterior moments (conjugate normal update at each V_k)
  post_mean <- matrix(0, p, K)
  post_mean2 <- matrix(0, p, K)
  for (k in seq_len(K)) {
    V_k <- grid[k]
    pv_k <- V_k * shat2_safe / (V_k + shat2_safe)  # posterior variance
    pm_k <- pv_k / shat2_safe * betahat            # posterior mean
    post_mean[, k] <- pm_k
    post_mean2[, k] <- pv_k + pm_k^2               # E[beta^2]
  }

  # Mixture posterior: weighted average over grid points
  model$mu[l, ] <- rowSums(r * post_mean)
  model$mu2[l, ] <- rowSums(r * post_mean2)

  # Clean up cached ser_stats
  model$.ser_stats <- NULL
  return(model)
}



================================================
FILE: R/model_methods.R
================================================
# =============================================================================
# MODEL-LEVEL S3 METHODS
# S3 generics dispatched on model class (model field access, initialization,
# convergence, ELBO)
# =============================================================================

#' Get prior variance for effect l
#' @keywords internal
get_prior_variance_l <- function(model, l) {
  UseMethod("get_prior_variance_l")
}

#' @keywords internal
get_prior_variance_l.default <- function(model, l) {
  model$V[l]
}

#' Set prior variance for effect l
#' @keywords internal
set_prior_variance_l <- function(model, l, V) {
  UseMethod("set_prior_variance_l")
}

#' @keywords internal
set_prior_variance_l.default <- function(model, l, V) {
  model$V[l] <- V
  model
}

#' Get posterior inclusion probabilities for effect l
#' @keywords internal
get_alpha_l <- function(model, l) {
  UseMethod("get_alpha_l")
}

#' @keywords internal
get_alpha_l.default <- function(model, l) {
  model$alpha[l, ]
}

#' Get posterior moments for effect l (for EM prior variance update)
#' @keywords internal
get_posterior_moments_l <- function(model, l) {
  UseMethod("get_posterior_moments_l")
}

#' @keywords internal
get_posterior_moments_l.default <- function(model, l) {
  list(post_mean = model$mu[l, ], post_mean2 = model$mu2[l, ])
}

#' Get PIP-weighted posterior mean for effect l (alpha * mu)
#' @keywords internal
get_posterior_mean_l <- function(model, l) {
  UseMethod("get_posterior_mean_l")
}

#' @keywords internal
get_posterior_mean_l.default <- function(model, l) {
  model$alpha[l, ] * model$mu[l, ]
}

#' Get sum of PIP-weighted posterior means across all effects
#' @keywords internal
get_posterior_mean_sum <- function(model) {
  UseMethod("get_posterior_mean_sum")
}

#' @keywords internal
get_posterior_mean_sum.default <- function(model) {
  colSums(model$alpha * model$mu)
}

# =============================================================================
# MODEL INITIALIZATION
#
# Initialize core model matrices and parameter storage.
# =============================================================================

#' @keywords internal
initialize_matrices <- function(data, params, var_y) {
  UseMethod("initialize_matrices")
}

# Build the core L x p model matrices: uniform alpha, zero posterior
# moments, prior variances expanded from the scaled prior variance, and
# NA placeholders for KL/lbf that are filled in during fitting.
#' @keywords internal
initialize_matrices.default <- function(data, params, var_y) {
  L <- params$L
  mat_init <- list(
    alpha = matrix(1 / data$p, L, data$p),
    mu = matrix(0, L, data$p),
    mu2 = matrix(0, L, data$p),
    V = expand_scaled_prior_variance(params$scaled_prior_variance, var_y, L),
    KL = rep(as.numeric(NA), L),
    lbf = rep(as.numeric(NA), L),
    lbf_variable = matrix(as.numeric(NA), L, data$p),
    sigma2 = params$residual_variance,
    pi = params$prior_weights,
    null_weight = params$null_weight,
    predictor_weights = rep(as.numeric(NA), data$p)
  )
  return(mat_init)
}

# =============================================================================
# VARIANCE UPDATE
#
# Update residual variance (and possibly other variance components) after
# each IBSS iteration.
# =============================================================================

#' @keywords internal
#' @importFrom utils modifyList
update_model_variance <- function(data, params, model) {
  UseMethod("update_model_variance")
}

# Update residual variance when estimation is enabled, clamp it to the
# user-specified bounds, then refresh any quantities derived from it.
#' @keywords internal
update_model_variance.default <- function(data, params, model) {
  if (!isTRUE(params$estimate_residual_variance))
    return(model)

  # Update variance components
  variance_result <- update_variance_components(data, params, model)
  model <- modifyList(model, variance_result)

  # Apply bounds to residual variance
  model$sigma2 <- min(max(model$sigma2, params$residual_variance_lowerbound),
                      params$residual_variance_upperbound)

  # Update derived quantities after variance component changes
  model <- update_derived_quantities(data, params, model)

  return(model)
}

# =============================================================================
# CONVERGENCE CHECKING
# =============================================================================

#' @keywords internal
check_convergence <- function(data, params, model, elbo, iter) {
  UseMethod("check_convergence")
}

#' Format the per-iter sigma2 cell for verbose output
#'
#' Default returns the scalar sigma2 in `%.4f`. Subclasses
#' (e.g., mfsusieR's list-of-vectors sigma2; mvsusieR's
#' matrix sigma2) override to a compact summary string of
#' fixed width.
#' @keywords internal
format_sigma2_summary <- function(model) {
  UseMethod("format_sigma2_summary")
}

#' @keywords internal
format_sigma2_summary.default <- function(model) {
  sprintf("%.4f", model$sigma2)
}

#' Append class-specific extra-diag columns to the verbose row
#'
#' Default returns an empty string. Subclasses override to inject
#' columns such as `max_pi_null`, `max_KL_l`, alpha-entropy
#' n_eff. Output is appended after the V column in the per-iter
#' tabular line.
#' @keywords internal
format_extra_diag <- function(model) {
  UseMethod("format_extra_diag")
}

# Default extra-diag: render the SS-path lambda inflation (and, when all
# finite B_corrected entries agree, a single effective B) or "" when
# lambda_bias is absent.
#' @keywords internal
format_extra_diag.default <- function(model) {
  if (is.null(model$lambda_bias))
    return("")
  lambda_infl <- model$lambda_bias
  # Zero-masking of small finite values happens at source in
  # estimate_lambda_bias; we just sanitize non-finite for display.
  lambda_infl[!is.finite(lambda_infl)] <- 0
  if (length(lambda_infl) != 1)
    stop("lambda_bias must be a scalar on the SS path.")
  lb <- paste0("lambda_infl=",
               format(lambda_infl, digits = 2, scientific = TRUE))
  if (!is.null(model$B_corrected)) {
    B_corrected <- model$B_corrected
    if (length(unique(B_corrected[is.finite(B_corrected)])) == 1) {
      lb <- paste0(lb, " B_eff=",
                   format(B_corrected[which(is.finite(B_corrected))[1]],
                          digits = 4, scientific = FALSE))
    }
  }
  lb
}

# Default convergence check. Uses ELBO-based convergence unless the
# user selected PIP-based convergence or the ELBO is NA/infinite this
# iteration; in either of those cases falls back to the alpha/PIP cycle
# check. Also emits the per-iteration verbose table.
#' @keywords internal
check_convergence.default <- function(data, params, model, elbo, iter) {
  verbose <- isTRUE(params$verbose)
  V_str <- format_V_summary(model$V)
  chat_str <- format_chat_summary(model)
  sigma2_str <- format_sigma2_summary(model)
  extra_str <- format_extra_diag(model)

  # Tabular verbose format (ELBO-convergence path): columns are
  # iter, ELBO, delta, sigma2, mem, V (variable-width, last),
  # plus optional class-specific extras after V.
  verbose_row_fmt <- "%4d %11.4f %9s %-9s %-7s %s%s%s"
  verbose_header <- sprintf("%-4s %11s %9s %-9s %-7s %s%s",
                            "iter", "ELBO", "delta", "sigma2", "mem", "V",
                            if (nzchar(extra_str)) " extras" else "")

  # Skip convergence check on first iteration (there is no previous
  # ELBO to compare against yet).
  if (iter == 1) {
    model$converged <- FALSE
    if (verbose) {
      elbo_val <- elbo[iter + 1]
      if (!is.na(elbo_val) && is.finite(elbo_val)) {
        message(verbose_header)
        message(sprintf(verbose_row_fmt, iter, elbo_val, "-", sigma2_str,
                        sprintf("%.2f GB", mem_used_gb()),
                        paste0(V_str, chat_str),
                        if (nzchar(extra_str)) paste0(" ", extra_str) else "",
                        ""))
      } else {
        message(sprintf("iter %3d: sigma2=%s, V=%s%s [mem: %.2f GB]",
                        iter, sigma2_str, V_str, chat_str, mem_used_gb()))
      }
    }
    return(model)
  }

  # Calculate difference in ELBO values
  ELBO_diff <- elbo[iter + 1] - model$runtime$prev_elbo
  ELBO_failed <- is.na(ELBO_diff) || is.infinite(ELBO_diff)

  if (params$convergence_method == "pip" || ELBO_failed) {
    if (ELBO_failed && params$convergence_method == "elbo") {
      warning_message(paste0("Iteration ", iter,
                             " produced an NA/infinite ELBO",
                             " value. Using pip-based convergence this iteration."))
    }

    # PIP/alpha convergence. pip_stall_window is reused as the maximum
    # short-cycle lag; it is no longer a "no improvement" stop.
    model <- check_alpha_pip_cycle_convergence(data, params, model)
    pip_diff <- model$runtime$pip_diff
    lambda_diff <- if (!is.null(model$runtime$lambda_bias_diff))
      model$runtime$lambda_bias_diff else 0

    # Coordinate EB guard: fit_R_mismatch runs after the SER sweep, so a
    # material lambda update must be consumed by one more sweep before
    # convergence.
    if (isTRUE(model$converged) && lambda_diff > params$tol) {
      model$converged <- FALSE
      model$convergence_reason <-
        paste0("lambda_infl_changed(",
               format(lambda_diff, digits = 3, scientific = TRUE), ")")
    }

    if (verbose) {
      conv_tag <- if (model$converged)
        paste0(" -- converged (", model$convergence_reason, ")") else ""
      lambda_str <- if (lambda_diff > 0)
        paste0(", max|d(lambda_infl)|=",
               format(lambda_diff, digits = 3, scientific = TRUE)) else ""
      message(sprintf("iter %3d: max|d(alpha,PIP)|=%.2e%s, V=%s%s%s%s [mem: %.2f GB]",
                      iter, pip_diff, lambda_str, V_str, chat_str,
                      if (nzchar(extra_str)) paste0(", ", extra_str) else "",
                      conv_tag, mem_used_gb()))
    }
    if (model$converged && !is.null(params$unmappable_effects) &&
        params$unmappable_effects %in% c("ash", "ash_filter_archived")) {
      model <- run_final_ash_pass(data, params, model)
    }
    return(model)
  }

  # Converge when ELBO stabilizes: small non-negative change.
  # A large negative ELBO_diff means the objective dropped, not convergence.
  if (ELBO_diff < -params$tol) {
    warning_message(sprintf("ELBO decreased by %.2e at iteration %d",
                            -ELBO_diff, iter))
  }
  model$converged <- (ELBO_diff >= 0 && ELBO_diff < params$tol)
  lambda_diff <- if (!is.null(model$runtime$lambda_bias_diff))
    model$runtime$lambda_bias_diff else 0

  # Coordinate EB guard: fit_R_mismatch runs after the SER sweep, so a
  # material lambda update must be consumed by one more sweep before
  # declaring convergence.
  if (isTRUE(model$converged) && lambda_diff > params$tol)
    model$converged <- FALSE

  if (verbose)
    message(sprintf(verbose_row_fmt, iter, elbo[iter + 1],
                    sprintf("%.2e", ELBO_diff), sigma2_str,
                    sprintf("%.2f GB", mem_used_gb()),
                    paste0(V_str, chat_str),
                    if (nzchar(extra_str)) paste0(" ", extra_str) else "",
                    if (model$converged) " converged" else ""))
  if (model$converged && !is.null(params$unmappable_effects) &&
      params$unmappable_effects %in% c("ash", "ash_filter_archived")) {
    model <- run_final_ash_pass(data, params, model)
  }
  return(model)
}

# =============================================================================
# OBJECTIVE FUNCTION (ELBO)
# =============================================================================

#' Compute the SuSiE ELBO (evidence lower bound)
#'
#' Building-block function used by downstream packages implementing
#' custom IBSS loops.
#'
#' @param data Data object.
#' @param params Params object.
#' @param model Model object.
#'
#' @return Scalar ELBO value.
#'
#' @export
#' @keywords internal
get_objective <- function(data, params, model) {
  UseMethod("get_objective")
}

#' @export
#' @keywords internal
get_objective.default <- function(data, params, model) {
  if (!is.null(params$unmappable_effects) &&
      params$unmappable_effects == "inf") {
    # Compute omega (precision-like quantity per effect and variable)
    L <- nrow(model$alpha)
    omega_res <- compute_omega_quantities(data, model$tau2, model$sigma2)
    omega <- matrix(0, L, data$p)
    for (l in seq_len(L)) {
      omega[l, ] <- omega_res$diagXtOmegaX + 1 / model$V[l]
    }

    # Compute total ELBO for infinitesimal effects model
    objective <- compute_elbo_inf(
      model$alpha, model$mu, omega, model$lbf, model$sigma2, model$tau2,
      data$n, data$p, data$eigen_vectors, data$eigen_values,
      data$VtXty, data$yty
    )
  } else if (params$use_NIG && nrow(model$alpha) == 1) {
    # NIG with a single effect: the marginal log-likelihood is exact.
    objective <- model$marginal_loglik[1]
  } else if (isTRUE(params$use_NIG)) {
    # NIG L>1: KL[l] is gated to 0 (gIBSS has no coherent ELBO); use the
    # proper variational expected log-likelihood.
    objective <- nig_eloglik(data, params, model)
  } else {
    # Standard ELBO computation. `na.rm = TRUE` so subclasses that
    # leave KL[l] = NA on null-effect rows (mfsusieR, mvsusieR) do
    # not need to override get_objective just to skip NAs.
    objective <- Eloglik(data, model) - sum(model$KL, na.rm = TRUE)
  }

  # Add slot prior ELBO terms when c_hat is active.
  # Without these, the ELBO is missing the prior and entropy contributions
  # from the slot activity model.
  if (!is.null(model$c_hat_state)) {
    objective <- objective + slot_prior_elbo(model)
  }

  if (is.infinite(objective)) {
    stop("get_objective() produced an infinite ELBO value")
  }
  return(objective)
}

# =============================================================================
# EFFECT TRIMMING
#
# Zero out effects with negligible prior variance after convergence.
# =============================================================================

#' @keywords internal
trim_null_effects <- function(data, params, model) {
  UseMethod("trim_null_effects")
}

# Reset every effect whose prior variance fell below prior_tol: alpha
# reverts to the prior weights and all posterior quantities go to zero.
#' @keywords internal
trim_null_effects.default <- function(data, params, model) {
  null_idx <- which(model$V < params$prior_tol)
  if (length(null_idx) == 0)
    return(model)
  model$V[null_idx] <- 0
  # rep(pi, each = k) fills the k x p submatrix column-by-column so each
  # trimmed row receives the full prior-weights vector.
  model$alpha[null_idx, ] <- rep(model$pi, each = length(null_idx))
  model$mu[null_idx, ] <- 0
  model$mu2[null_idx, ] <- 0
  model$lbf_variable[null_idx, ] <- 0
  model$lbf[null_idx] <- 0
  model$KL[null_idx] <- 0
  return(model)
}



================================================
FILE: R/mr.ash.R
================================================
#' @title Multiple Regression with Adaptive Shrinkage
#'
#' @description Model fitting algorithms for Multiple Regression with
#' Adaptive Shrinkage ("Mr.ASH"). Mr.ASH is a variational empirical
#' Bayes (VEB) method for multiple linear regression. The fitting
#' algorithms (locally) maximize the approximate marginal likelihood
#' (the "evidence lower bound", or ELBO) via coordinate-wise updates.
#'
#' @details Mr.ASH is a statistical inference method for the following
#' multiple linear regression model: \deqn{y | X, \beta, \sigma^2 ~
#' N(X \beta, \sigma^2 I_n),} in which the regression coefficients
#' \eqn{\beta} admit a mixture-of-normals prior, \deqn{\beta | \pi,
#' \sigma ~ g = \sum_{k=1}^K N(0, \sigma^2 \sigma_k^2).} Each mixture
#' component in the prior, \eqn{g}, is a normal density centered at
#' zero, with variance \eqn{\sigma^2 \sigma_k^2}.
#'
#' The fitting algorithm, if run for a large enough number of
#' iterations, will find an approximate posterior for the regression
#' coefficients, denoted by \eqn{q(\beta)}, residual variance
#' parameter \eqn{\sigma^2}, and prior mixture weights \eqn{\pi_1,
#' \ldots, \pi_K} maximizing the evidence lower bound, \deqn{F(q, \pi,
#' \sigma^2) = E_q \log p(y | X, \beta, \sigma^2) - \sum_{j=1}^p
#' D_{KL}(q_j || g),} where \eqn{D_{KL}(q_j || g)} denotes the
#' Kullback-Leibler (KL) divergence, a measure of the "distance"
#' between (approximate) posterior \eqn{q_j(\beta_j)} and prior
#' \eqn{g(\beta_j)}. The fitting algorithm iteratively updates the
#' approximate posteriors \eqn{q_1, \ldots, q_p}, separately for each
#' \eqn{j = 1, \ldots, p} (in an order determined by
#' \code{update.order}), then separately updates the mixture weights
#' \eqn{\pi} and residual variance \eqn{\sigma^2}. This
#' coordinate-wise update scheme iterates until the convergence
#' criterion is met, or until the algorithm hits an upper bound on
#' the number of iterations (specified by \code{max.iter}). Coordinate-wise
#' optimization algorithms for model fitting are implemented in C++ for
#' efficient handling of large-scale data.
#'
#' See \sQuote{References} for more details about the model and
#' algorithm.
#'
#' @param X The input matrix, of dimension (n,p); each column is a
#' single predictor; and each row is an observation vector. Here, n is
#' the number of samples and p is the number of predictors.
The matrix
#' cannot be sparse.
#'
#' @param y The observed continuously-valued responses, a vector of
#' length n.
#'
#' @param Z The covariate matrix, of dimension (n,k), where k is the
#' number of covariates. This feature is not yet implemented;
#' \code{Z} must be set to \code{NULL}.
#'
#' @param sa2 The vector of prior mixture component variances. The
#' variances should be in increasing order, starting at zero; that is,
#' \code{sort(sa2)} should be the same as \code{sa2}. When \code{sa2}
#' is \code{NULL}, the default setting is used, \code{sa2[k] =
#' (2^(0.04*(k-1)) - 1)^2}, for \code{k = 1:25}, rescaled by
#' \code{n/median(diag(crossprod(X)))}. For this default setting,
#' \code{sa2[1] = 0}.
#'
#' @param method_q The algorithm used to update the variational
#' approximation to the posterior distribution of the regression
#' coefficients, \code{method = "sigma_dep_q"} and \code{method =
#' "sigma_indep_q"}, take different approaches to updating the
#' residual variance \eqn{\sigma^2}.
#'
#' @param method_g \code{method = "caisa"}, an abbreviation of
#' "Coordinate Ascent Iterative Shrinkage Algorithm", fits the model
#' by approximate EM; it iteratively updates the variational
#' approximation to the posterior distribution of the regression
#' coefficients (the approximate E-step) and the model parameters
#' (mixture weights and residual covariance) in an approximate
#' M-step. Settings \code{method = "block"} and
#' \code{method = "accelerate"} are considered experimental.
#'
#' @param max.iter The maximum number of outer loop iterations allowed.
#'
#' @param min.iter The minimum number of outer loop iterations allowed.
#'
#' @param beta.init The initial estimate of the (approximate)
#' posterior mean regression coefficients. This should be \code{NULL},
#' or a vector of length p. When \code{beta.init} is \code{NULL}, the
#' posterior mean coefficients are all initially set to zero.
#'
#' @param update.pi If \code{update.pi = TRUE}, the mixture
#' proportions in the mixture-of-normals prior are estimated from the
#' data. In the manuscript, \code{update.pi = TRUE}.
#'
#' @param pi The initial estimate of the mixture proportions
#' \eqn{\pi_1, \ldots, \pi_K}. If \code{pi} is \code{NULL}, the
#' mixture weights are initialized to \code{rep(1/K,K)}, where
#' \code{K = length(sa2)}.
#'
#' @param update.sigma2 If \code{update.sigma2 = TRUE}, the residual
#' variance \eqn{\sigma^2} is estimated from the data. In the manuscript,
#' \code{update.sigma2 = TRUE}.
#'
#' @param sigma2 The initial estimate of the residual variance,
#' \eqn{\sigma^2}. If \code{sigma2 = NULL}, the residual variance is
#' initialized to the empirical variance of the residuals based on the
#' initial estimates of the regression coefficients, \code{beta.init},
#' after removing linear effects of the intercept and any covariates.
#'
#' @param update.order The order in which the co-ordinate ascent
#' updates for estimating the posterior mean coefficients are
#' performed. \code{update.order} can be \code{NULL}, \code{"random"},
#' or any permutation of \eqn{(1,\ldots,p)}, where \code{p} is the number
#' of columns in the input matrix \code{X}. When \code{update.order}
#' is \code{NULL}, the co-ordinate ascent updates are performed in the
#' order in which they appear in \code{X}; this is equivalent to
#' setting \code{update.order = 1:p}. When \code{update.order =
#' "random"}, the co-ordinate ascent updates are performed in a
#' randomly generated order, and this random ordering is different at
#' each outer-loop iteration.
#'
#' @param standardize The logical flag for standardization of the
#' columns of X variable, prior to the model fitting. The coefficients
#' are always returned on the original scale.
#'
#' @param intercept When \code{intercept = TRUE}, an intercept is
#' included in the regression model.
#'
#' @param tol Additional settings controlling behaviour of the model
#' fitting algorithm. \code{tol$convtol} controls the termination
#' criterion for the model fitting. The outer-loop updates stop when
#' the relative L2 change in the estimates of the posterior mean
#' coefficients is less than \code{convtol}, i.e., \code{||beta_new -
#' beta_old||_2 / max(1, ||beta_old||_2) < convtol}.
#' \code{tol$epstol} is a small, positive number added to the
#' likelihoods to avoid logarithms of zero.
#'
#' @param verbose If \code{verbose = TRUE}, some information about the
#' status of the model fitting is printed to the console.
#'
#' @return A list object with the following elements:
#'
#' \item{intercept}{The estimated intercept.}
#'
#' \item{beta}{A vector containing posterior mean estimates of the
#' regression coefficients for all predictors.}
#'
#' \item{sigma2}{The estimated residual variance.}
#'
#' \item{pi}{A vector containing the estimated mixture
#' proportions.}
#'
#' \item{iter}{The number of outer-loop iterations that were
#' performed.}
#'
#' \item{update.order}{The ordering used for performing the
#' coordinate-wise updates. For \code{update.order = "random"}, the
#' orderings for outer-loop iterations are provided in a vector of
#' length \code{p*max.iter}, where \code{p} is the number of predictors.}
#'
#' \item{varobj}{A vector of length \code{numiter}, containing the
#' value of the variational objective (equal to the negative "evidence
#' lower bound") attained at each (outer-loop) model fitting
#' iteration. Note that the objective does not account for the
#' intercept term, even when \code{intercept = TRUE}; therefore, this
#' value should be interpreted as being an approximation to the
#' marginal likelihood \emph{conditional} on the estimate of the
#' intercept.}
#'
#' \item{data}{The preprocessed data (X, Z, y) provided as input to the model
#' fitting algorithm.
\code{data$w} is equal to
#' \code{diag(crossprod(X))}, in which \code{X} is the preprocessed
#' data matrix. Additionally, \code{data$sa2} gives the prior variances
#' used.}
#'
#' @seealso \code{\link{get.full.posterior}}, \code{\link{predict.mr.ash}}
#'
#' @references
#'
#' Y. Kim (2020), Bayesian shrinkage methods for high dimensional
#' regression. Ph.D. thesis, University of Chicago.
#'
#' @useDynLib susieR, .registration = TRUE
#'
#' @importFrom utils modifyList
#' @importFrom stats var
#'
#' @examples
#' ### generate synthetic data
#' set.seed(1)
#' n = 200
#' p = 300
#' X = matrix(rnorm(n*p),n,p)
#' beta = double(p)
#' beta[1:10] = 1:10
#' y = X %*% beta + rnorm(n)
#'
#' ### fit Mr.ASH
#' fit.mr.ash = mr.ash(X,y, method_q = "sigma_indep_q")
#'
#' fit.mr.ash = mr.ash(X,y, method_q = "sigma_dep_q")
#'
#' ### prediction routine
#' Xnew = matrix(rnorm(n*p),n,p)
#' ynew = Xnew %*% beta + rnorm(n)
#' ypred = predict(fit.mr.ash, Xnew)
#'
#' ### test error
#' rmse = norm(ynew - ypred, '2') / sqrt(n)
#'
#' ### coefficients
#' betahat = predict(fit.mr.ash, type = "coefficients")
#' # this equals c(fit.mr.ash$intercept, fit.mr.ash$beta)
#'
#' @export
#'
mr.ash = function(X, y, Z = NULL, sa2 = NULL,
                  method_q = c("sigma_dep_q","sigma_indep_q"),
                  method_g = c("caisa","accelerate","block"),
                  max.iter = 1000, min.iter = 1, beta.init = NULL,
                  update.pi = TRUE, pi = NULL, update.sigma2 = TRUE,
                  sigma2 = NULL, update.order = NULL, standardize = FALSE,
                  intercept = TRUE, tol = set_default_tolerance(),
                  verbose = TRUE){

  # get sizes
  n = nrow(X)
  p = ncol(X)

  # check necessary conditions on the user-supplied prior variance grid
  if (!is.null(sa2)) {
    if (any(sa2 < 0)) {
      stop ("all the mixture component variances must be non-negative.")
    }
    if (sa2[1] != 0) {
      stop ("the first mixture component variance sa2[1] must be 0.")
    }
  }

  # check Z
  if (!is.null(Z)) {
    stop("covariates are not currently fully implemented; Z should be set to NULL")
  }

  # match method
  method_q = match.arg(method_q)
  method_g = match.arg(method_g)

  # set default tolerances unless specified
  tol0 = set_default_tolerance()
  tol = modifyList(tol0,tol,keep.null = TRUE)

  # remove covariates
  data = remove_covariate(X, y, Z, standardize, intercept)

  # initialize beta; when standardize = TRUE, map beta.init onto the
  # standardized scale of X
  if ( is.null(beta.init) ){
    data$beta = as.vector(double(p))
  } else {
    if (standardize) {
      data$beta = as.vector(beta.init) * attr(data$X,"scaled:scale")
    } else {
      data$beta = as.vector(beta.init)
    }
  }
  data$beta[1] = data$beta[1] + 0 # to make sure beta.init is not modified

  # initialize r
  r = data$y - data$X %*% data$beta

  # sigma2: default to the (population) variance of the initial residuals
  if (is.null(sigma2)) sigma2 = c(var.n(r))

  # precompute x_j^T x_j
  w = colSums(data$X^2)
  data$w = w

  # set sa2 if missing: 25-point grid (2^((k-1)/25) - 1)^2, rescaled by
  # n / median(x_j^T x_j)
  if ( is.null(sa2) ) {
    sa2 = (2^((0:24) / 25) - 1)^2
    sa2 = sa2 / median(data$w) * n
  }
  K = length(sa2)
  data$sa2 = sa2

  # initialize other parameters: uniform mixture weights when beta.init
  # is absent; otherwise derive weights from normalized per-coordinate
  # responsibilities Phi computed under the initial beta
  if ( is.null(pi) ) {
    if ( is.null(beta.init) ){
      Phi = matrix(1,p,K)/K
      pi = rep(1,K)/K
    } else {
      S = outer(1/w, sa2, '+') * sigma2
      Phi = -data$beta^2/S/2 - log(S)/2
      Phi = exp(Phi - apply(Phi,1,max))
      Phi = Phi / rowSums(Phi)
      pi = colMeans(Phi)
    }
  } else
    Phi = matrix(rep(pi, each = p), nrow = p)
  pi[1] <- pi[1] + 0 # force a local copy (mirrors the beta.init trick above)

  # run algorithm; o holds zero-based coordinate update orders for all
  # outer-loop iterations
  if ( is.null(update.order) ) {
    o = rep(0:(p-1), max.iter)
  } else if (is.numeric(update.order)) {
    o = rep(update.order - 1, max.iter)
  } else if (update.order == "random") {
    o = random_order(p, max.iter)
  }
  out = caisa_cpp (data$X, w, sa2, pi, data$beta, r, sigma2, o,
                   max.iter, min.iter, tol$convtol, tol$epstol,
                   method_q, update.pi, update.sigma2, verbose)

  ## Convert to plain numeric vectors (drop matrix dim from Armadillo)
  out$beta = c(out$beta)
  out$pi = c(out$pi)
  out$sigma2 = c(out$sigma2)

  # NOTE(review): match.arg restricts method_q to "sigma_dep_q" or
  # "sigma_indep_q", so this branch appears unreachable -- confirm
  # whether "sigma_scaled_beta" was meant to be a supported choice.
  if (method_q == "sigma_scaled_beta") {
    out$beta = out$beta * sqrt(out$sigma2)
  }

  ## polish return object
  out$intercept = c(data$ZtZiZy - data$ZtZiZX %*% out$beta)
  data["beta"] = NULL
  out$data = data
  out$update.order = o

  ## rescale beta if needed
  if (standardize) out$beta = out$beta / attr(data$X, "scaled:scale")
  class(out) <- c("mr.ash", "list")

  ## warn if necessary: substantial weight on the largest prior variance
  ## suggests the grid should be extended
  if (update.pi & out$pi[K] > 1/K) {
    warning(sprintf(paste("The mixture proportion associated with the",
                          "largest prior variance is greater than %0.2e;",
                          "this indicates that the model fit could be",
                          "improved by using a larger setting of the",
                          "prior variance. Consider increasing the range",
                          "of the variances \"sa2\"."),1/K))
  }
  return(out)
}

#' @title Extract Regression Coefficients from Mr.ASH Fit
#'
#' @description Retrieve posterior mean estimates of the regression
#' coefficients in a Mr.ASH model.
#'
#' @param object A Mr.ASH fit, usually the result of calling
#' \code{mr.ash}.
#'
#' @param ... Additional arguments passed to the default S3 method.
#'
#' @return A p+1 vector. The first element gives the estimated
#' intercept, and the remaining p elements are the estimated
#' regression coefficients.
#'
#' @examples
#' ## generate synthetic data
#' set.seed(1)
#' n = 200
#' p = 300
#' X = matrix(rnorm(n*p),n,p)
#' beta = double(p)
#' beta[1:10] = 1:10
#' y = X %*% beta + rnorm(n)
#'
#' ## fit mr.ash
#' fit.mr.ash = mr.ash(X, y)
#'
#' ## coefficient
#' coef.mr.ash = coef(fit.mr.ash)
#' intercept = coef.mr.ash[1]
#' beta = coef.mr.ash[-1]
#'
#' @importFrom stats coef
#'
#' @export coef.mr.ash
#'
#' @export
#'
coef.mr.ash = function (object, ...)
  c(object$intercept,object$beta)

#' @title Predict Outcomes or Extract Coefficients from Mr.ASH Fit
#'
#' @description This function predicts outcomes (y) given the observed
#' variables (X) and a Mr.ASH model; alternatively, retrieve the
#' estimates of the regression coefficients.
#'
#' @param object A mr_ash fit, usually the result of calling
#' \code{mr.ash}.
#'
#' @param newx The input matrix, of dimension (n,p); each column is a
#' single predictor; and each row is an observation vector. Here, n is
#' the number of samples and p is the number of predictors. When
#' \code{newx} is \code{NULL}, the fitted values for the training data
#' are provided.
#'
#' @param type The type of output.
For \code{type = "response"},
#' predicted or fitted outcomes are returned; for \code{type =
#' "coefficients"}, the estimated coefficients are returned.
#'
#' @param ... Additional arguments passed to the default S3 method.
#'
#' @return For \code{type = "response"}, predicted or fitted outcomes
#' are returned; for \code{type = "coefficients"}, the estimated
#' coefficients are returned.
#'
#' @examples
#' ## generate synthetic data
#' set.seed(1)
#' n = 200
#' p = 300
#' X = matrix(rnorm(n*p),n,p)
#' beta = double(p)
#' beta[1:10] = 1:10
#' y = X %*% beta + rnorm(n)
#'
#' ## fit mr.ash
#' fit.mr.ash = mr.ash(X, y)
#'
#' ## predict
#' Xnew = matrix(rnorm(n*p),n,p)
#' ypred = predict(fit.mr.ash, Xnew)
#'
#' @importFrom stats predict
#'
#' @export predict.mr.ash
#'
#' @export
#'
predict.mr.ash = function(object,newx = NULL, type=c("response","coefficients"),...) {
  type <- match.arg(type)

  # Coefficient extraction: newx is meaningless here, so reject it.
  if (type == "coefficients"){
    if(!missing(newx))
      stop("Do not supply newx when predicting coefficients")
    return(coef(object))
  }

  # No new predictors supplied: return fitted values for training data.
  if (missing(newx))
    return(object$fitted)

  # Predictions for new data; only an intercept "covariate" is supported.
  if (!all(object$data$Z == 1))
    stop("predict.mr.ash is not implemented for covariates Z other than ",
         "intercept")
  b = coef(object)
  return(drop(object$intercept + newx %*% b[-1]))
}

# Default settings for the mr.ash stopping rules: epstol guards against
# logarithms of zero, convtol is the outer-loop convergence threshold.
set_default_tolerance = function()
  list(epstol = 1e-12, convtol = 1e-4)

#' @title Approximation Posterior Expectations from Mr.ASH Fit
#'
#' @description Recover the parameters specifying the variational
#' approximation to the posterior distribution of the regression
#' coefficients. To streamline the model fitting implementation, and
#' to reduce memory requirements, \code{\link{mr.ash}} does not store
#' all the parameters needed to specify the approximate posterior.
#'
#' @param fit A Mr.ASH fit obtained, for example, by running
#' \code{mr.ash}.
#'
#' @return A list object with the following elements:
#'
#' \item{phi}{A p x K matrix containing the posterior assignment
#' probabilities, where p is the number of predictors, and K is the
#' number of mixture components. (Each row of \code{phi} should sum to
#' 1.)}
#'
#' \item{m}{A p x K matrix containing the posterior means conditional
#' on assignment to each mixture component.}
#'
#' \item{s2}{A p x K matrix containing the posterior variances
#' conditional on assignment to each mixture component.}
#'
#' @examples
#' ## generate synthetic data
#' set.seed(1)
#' n = 200
#' p = 300
#' X = matrix(rnorm(n*p),n,p)
#' beta = double(p)
#' beta[1:10] = 1:10
#' y = X %*% beta + rnorm(n)
#'
#' ## fit mr.ash
#' fit.mr.ash = mr.ash(X, y)
#'
#' ## recover full posterior
#' full.post = get.full.posterior(fit.mr.ash)
#'
#' @export
#'
get.full.posterior <- function(fit) {

  # compute residual
  r = fit$data$y - fit$data$X %*% fit$beta

  # compute bw and s2
  bw = as.vector((t(fit$data$X) %*% r) + fit$data$w * fit$beta)
  s2 = fit$sigma2 / outer(fit$data$w, 1/fit$data$sa2, '+')

  # compute m, phi; phi rows are exponentiated after subtracting the
  # row maximum for numerical stability, then normalized to sum to 1
  m = bw * s2 / fit$sigma2
  phi = -log(1 + outer(fit$data$w,fit$data$sa2))/2 + m * (bw/2/fit$sigma2)
  phi = c(fit$pi) * t(exp(phi - apply(phi,1,max)))
  phi = t(phi) / colSums(phi)
  return (list(phi = phi, m = m, s2 = s2))
}

# Gibbs sampler front end: preprocesses the data (covariate removal,
# initialization of beta, residuals and sigma2) before delegating to the
# sampling backend.
gibbs.sampling = function(X, y, pi, sa2 = (2^((0:19) / 20) - 1)^2,
                          max.iter = 1500, burn.in = 500,
                          standardize = FALSE, intercept = TRUE,
                          sigma2 = NULL, beta.init = NULL, verbose = TRUE){

  # get sizes
  n = nrow(X)
  p = ncol(X)

  # remove covariates
  data = remove_covariate(X, y, NULL, standardize, intercept)
  if ( is.null(beta.init) )
    data$beta = as.vector(double(p))
  else
    data$beta = as.vector(beta.init)

  # initialize r
  r = data$y - data$X %*% data$beta

  # sigma2
  if ( is.null(sigma2) )
    sigma2 = c(var(r))

  # precalculate
  w = colSums(data$X^2)
  data$w = w

  # gibbs sampling
  # NOTE(review): this calls gibbs.sampling itself with a different,
  # positional argument list (w where y is expected, sa2 where pi is
  # expected, etc.), which as written recurses indefinitely. Presumably
  # a compiled backend (e.g. a *_cpp routine) was intended here --
  # confirm against the package's C++ sources.
  out = gibbs.sampling(data$X, w, sa2, pi, data$beta, r, sigma2, max.iter, burn.in, verbose)
  out$data = data
  out$mu = c(data$ZtZiZy - data$ZtZiZX %*% out$beta)
  return (out)
}

# Population variance: divides by n rather than n-1.
var.n = function(x) {
  a = x - mean(x)
  return (sum(a^2) / length(a))
}

================================================
FILE: R/mr.ash.rss.R
================================================

#' @title Bayesian Multiple Regression with Mixture-of-Normals Prior (RSS)
#'
#' @description This function performs Bayesian multiple regression with a
#' mixture-of-normals prior using summary statistics (RSS: Regression with
#' Summary Statistics). It uses a C++ implementation for efficient computation.
#'
#' @param bhat Numeric vector of observed effect sizes (standardized).
#' @param shat Numeric vector of standard errors of effect sizes.
#' @param R Numeric matrix of the correlation matrix.
#' @param var_y Numeric value of the variance of the outcome.
#'   If NULL, it is set to Inf (effects on standardized scale).
#' @param n Integer value of the sample size.
#' @param s0 Numeric vector of prior variances for the mixture components.
#' @param w0 Numeric vector of prior weights for the mixture components.
#' @param sigma2_e Numeric value of the initial error variance estimate.
#'   If \code{NULL} (default), initialized to \code{var_y} (matching
#'   \code{mr.ash} behavior of using residual variance with zero
#'   initialization), or 1 when \code{var_y = Inf}.
#' @param mu1_init Numeric vector of initial values for the posterior mean of
#'   the coefficients. Default is \code{numeric(0)} (initialize to zero).
#' @param tol Numeric value of the convergence tolerance. Default is 1e-8.
#' @param max_iter Integer value of the maximum number of iterations.
#'   Default is 1e5.
#' @param z Numeric vector of Z-scores. If not provided, computed as
#'   \code{bhat / shat}.
#' @param update_w0 Logical value indicating whether to update the mixture
#'   weights. Default is TRUE.
#' @param update_sigma Logical value indicating whether to update the error
#'   variance. Default is TRUE.
#' @param compute_ELBO Logical value indicating whether to compute the #' Evidence Lower Bound (ELBO). Default is TRUE. #' @param standardize Logical value indicating whether to standardize the #' input data. Default is FALSE. #' #' @return A list containing the following components: #' \describe{ #' \item{beta}{Numeric vector of posterior mean coefficients (same as mu1).} #' \item{sigma2}{Numeric value of the residual variance (same as sigma2_e).} #' \item{pi}{Numeric vector of mixture weights (same as w0).} #' \item{iter}{Integer, number of iterations performed.} #' \item{varobj}{Numeric vector of ELBO values per iteration.} #' \item{mu1}{Numeric vector of the posterior mean of the coefficients.} #' \item{sigma2_1}{Numeric vector of the posterior variance of the coefficients.} #' \item{w1}{Numeric matrix of the posterior assignment probabilities.} #' \item{sigma2_e}{Numeric value of the error variance.} #' \item{w0}{Numeric vector of the mixture weights.} #' \item{ELBO}{Numeric value of the Evidence Lower Bound (if \code{compute_ELBO = TRUE}).} #' } #' #' @examples #' # Generate example data #' set.seed(985115) #' n <- 350 #' p <- 16 #' sigmasq_error <- 0.5 #' zeroes <- rbinom(p, 1, 0.6) #' beta.true <- rnorm(p, 1, sd = 4) #' beta.true[zeroes] <- 0 #' #' X <- cbind(matrix(rnorm(n * p), nrow = n)) #' X <- scale(X, center = TRUE, scale = FALSE) #' y <- X %*% matrix(beta.true, ncol = 1) + rnorm(n, 0, sqrt(sigmasq_error)) #' y <- scale(y, center = TRUE, scale = FALSE) #' #' # Set the prior #' K <- 9 #' sigma0 <- c(0.001, .1, .5, 1, 5, 10, 20, 30, .005) #' omega0 <- rep(1 / K, K) #' #' # Calculate summary statistics #' b.hat <- sapply(1:p, function(j) { #' summary(lm(y ~ X[, j]))$coefficients[-1, 1] #' }) #' s.hat <- sapply(1:p, function(j) { #' summary(lm(y ~ X[, j]))$coefficients[-1, 2] #' }) #' R.hat <- cor(X) #' var_y <- var(y) #' sigmasq_init <- 1.5 #' #' # Run mr.ash.rss #' out <- mr.ash.rss(b.hat, s.hat, #' R = R.hat, var_y = var_y, n = n, #' sigma2_e = 
sigmasq_init, s0 = sigma0, w0 = omega0,
#'   mu1_init = rep(0, ncol(X)), tol = 1e-8, max_iter = 1e5,
#'   update_w0 = TRUE, update_sigma = TRUE, compute_ELBO = TRUE,
#'   standardize = FALSE
#' )
#'
#' @export
mr.ash.rss <- function(bhat, shat, R, var_y, n, s0, w0, sigma2_e = NULL,
                       mu1_init = numeric(0), tol = 1e-8, max_iter = 1e5,
                       z = numeric(0), update_w0 = TRUE, update_sigma = TRUE,
                       compute_ELBO = TRUE, standardize = FALSE) {

  # A NULL outcome variance means "unknown"; effects are then treated as
  # being on the standardized scale.
  if (is.null(var_y)) var_y <- Inf

  # Derive z-scores from the marginal statistics when not supplied.
  if (identical(z, numeric(0))) z <- bhat / shat

  # Default sigma2_e: use var_y when available (matches mr.ash behavior of
  # initializing to var(residuals) when beta.init is zero, since
  # var(y - X*0) = var(y)). When var_y is Inf (standardized scale),
  # default to 1.
  if (is.null(sigma2_e)) sigma2_e <- if (is.finite(var_y)) var_y else 1

  # All of the heavy lifting happens in the compiled backend.
  fit <- mr_ash_rss_cpp(
    bhat = bhat, shat = shat, z = z, R = R, var_y = var_y, n = n,
    sigma2_e = sigma2_e, s0 = s0, w0 = w0, mu1_init = mu1_init,
    tol = tol, max_iter = max_iter, update_w0 = update_w0,
    update_sigma = update_sigma, compute_ELBO = compute_ELBO,
    standardize = standardize
  )

  # Mirror the mr.ash output names so downstream code can treat the two
  # kinds of fits interchangeably.
  fit$beta <- c(fit$mu1)               # posterior mean coefficients
  fit$sigma2 <- c(fit$sigma2_e)        # residual variance (scalar)
  fit$pi <- c(fit$w0)                  # mixture weights
  fit$iter <- as.integer(c(fit$iter))  # iteration count
  fit$varobj <- c(fit$varobj)          # ELBO per iteration
  return(fit)
}

================================================
FILE: R/predict.susie.R
================================================

#' @title Extract regression coefficients from susie fit
#'
#' @param object A susie fit.
#'
#' @param \dots Additional arguments passed to the generic \code{coef}
#' method.
#'
#' @return A p+1 vector, the first element being an intercept, and the
#' remaining p elements being estimated regression coefficients.
#'
#' @importFrom stats coef
#'
#' @method coef susie
#'
#' @export coef.susie
#'
#' @export
#'
coef.susie <- function(object, ...) {
  fit <- object
  scale_factors <- fit$X_column_scale_factors
  # Posterior-mean effect per variable, summed over the single effects
  # and mapped back to the original scale of X.
  b <- colSums(fit$alpha * fit$mu) / scale_factors
  # Include the unmappable-effect estimates (theta) when present.
  if (!is.null(fit$theta))
    b <- b + fit$theta / scale_factors
  c(fit$intercept, b)
}

#' @title Predict outcomes or extract coefficients from susie fit.
#'
#' @param object A susie fit.
#'
#' @param newx A new value for X at which to do predictions.
#'
#' @param type The type of output. For \code{type = "response"},
#' predicted or fitted outcomes are returned; for \code{type =
#' "coefficients"}, the estimated coefficients are returned.
#'
#' @param \dots Other arguments used by generic predict function. These
#' extra arguments are not used here.
#'
#' @return For \code{type = "response"}, predicted or fitted outcomes
#' are returned; for \code{type = "coefficients"}, the estimated
#' coefficients are returned. If the susie fit has intercept =
#' \code{NA} (which is common when using \code{susie_ss}) then
#' predictions are computed using an intercept of 0, and a warning is
#' emitted.
#'
#' @importFrom stats coef
#'
#' @method predict susie
#'
#' @export predict.susie
#'
#' @export
#'
predict.susie <- function(object, newx = NULL,
                          type = c("response", "coefficients"), ...) {
  fit <- object
  type <- match.arg(type)

  # Coefficient extraction ignores newx, so supplying it is an error.
  if (type == "coefficients") {
    if (!missing(newx))
      stop("Do not supply newx when predicting coefficients")
    return(coef(fit))
  }

  # No new data: return fitted values from the training data.
  if (missing(newx))
    return(fit$fitted)

  b <- coef(fit)[-1]
  if (is.na(fit$intercept)) {
    # Intercept unavailable (e.g. sufficient-statistics fits): predict
    # with intercept 0 and tell the user.
    warning_message("The prediction assumes intercept = 0")
    drop(newx %*% b)
  } else {
    drop(fit$intercept + newx %*% b)
  }
}

================================================
FILE: R/refinement.R
================================================

#' Block coordinate ascent for iterative model refinement.
#' #' Generic framework for post-convergence refinement of fitted models. #' Repeatedly applies a block update (\code{step_fn}) to a fitted model, #' monitoring ELBO for convergence and stability. Both CS refinement #' (\code{\link{run_refine}}) and residual variance estimation (mvsusieR) #' are instances of block coordinate ascent over different parameter blocks. #' #' Convergence is reached when either: #' \itemize{ #' \item \code{step_fn} returns \code{converged = TRUE} #' (the block update signals no further improvement), or #' \item the relative ELBO change falls below \code{tol} #' (ELBO stabilized across block updates). #' } #' #' A warning is issued if the ELBO decreases between iterations. #' #' @param model Fitted model (e.g., from \code{susie_workhorse} or #' \code{mvsusie_workhorse}). #' @param data Data object passed to \code{step_fn}. #' @param step_fn A function with signature #' \code{function(model, data, iter)} that performs one block coordinate #' update. Must return a named list with elements: #' \describe{ #' \item{model}{(required) The updated model.} #' \item{data}{(optional) Updated data object, e.g. after changing #' residual variance. If \code{NULL}, the data is unchanged.} #' \item{converged}{(optional) Logical; if \code{TRUE}, stop #' iterating.} #' \item{log_msg}{(optional) Character string appended to verbose #' output.} #' } #' @param max_iter Maximum number of block ascent iterations #' (default 100). #' @param tol Convergence tolerance for relative ELBO change #' (default 1e-3). #' @param verbose If \code{TRUE}, print progress each iteration #' (default \code{FALSE}). #' #' @return The refined model, with \code{model$converged} set to #' \code{TRUE} or \code{FALSE}. 
#'
#' @export
block_coordinate_ascent <- function(model, data, step_fn, max_iter = 100,
                                    tol = 1e-3, verbose = FALSE) {
  # prev_elbo / prev_model always hold the last ACCEPTED state, so a
  # harmful block update can be rolled back below.
  prev_elbo <- susie_get_objective(model)
  prev_model <- model
  converged <- FALSE
  for (iter in seq_len(max_iter)) {
    result <- step_fn(model, data, iter)
    model <- result$model
    # The step may also update the data object (e.g. residual variance).
    if (!is.null(result$data)) data <- result$data
    current_elbo <- susie_get_objective(model)
    elbo_change <- current_elbo - prev_elbo
    # If ELBO decreased, the step did not improve the objective.
    # Revert to the previous model and treat as converged.
    if (elbo_change < 0) {
      if (verbose) message(sprintf(
        "Block ascent iter %d: update did not improve ELBO (change=%.4g); ",
        iter, elbo_change), "rejecting update and stopping.")
      model <- prev_model
      converged <- TRUE
      break
    }
    if (verbose) {
      msg <- sprintf("Block ascent iter %d: ELBO=%.4f, change=%.4g",
                     iter, current_elbo, elbo_change)
      if (!is.null(result$log_msg)) msg <- paste0(msg, ", ", result$log_msg)
      message(msg)
    }
    # Convergence: step_fn signals done, or ELBO stabilized
    if (isTRUE(result$converged)) {
      converged <- TRUE
      break
    }
    # Relative ELBO change, guarded against division by tiny objectives.
    elbo_delta <- abs(elbo_change) / max(1, abs(current_elbo))
    if (elbo_delta < tol) {
      converged <- TRUE
      break
    }
    # Accept this iteration's state as the new rollback point.
    prev_elbo <- current_elbo
    prev_model <- model
  }
  model$converged <- converged
  if (!converged)
    warning_message("Block coordinate ascent did not converge in ", max_iter,
                    " iterations")
  return(model)
}

# Credible set refinement via block coordinate ascent.
#
# For each credible set, perturbs prior weights (zeroing out the CS
# variables) and re-fits via a two-step procedure:
#   Step 1: fit with zeroed CS weights (explores alternative signals)
#   Step 2: re-fit with original weights, warm-started from Step 1
# The best candidate (highest ELBO) is accepted if it improves beyond
# tolerance. This is repeated until no further improvement.
#
# @keywords internal
run_refine <- function(model, data, params) {
  if (!is.null(params$model_init))
    warning_message("The given model_init is not used in refinement")
  pw_s <- extract_prior_weights(model)

  # One block coordinate step: try refining each CS, pick best candidate.
  cs_refine_step <- function(model, data, iter) {
    # Nothing to refine when the fit has no credible sets.
    if (is.null(model$sets) || length(model$sets$cs) == 0)
      return(list(model = model, converged = TRUE))
    candidates <- list()
    for (cs_idx in seq_along(model$sets$cs)) {
      # Zero out prior weights for variables in this CS
      pw_cs <- pw_s
      pw_cs[model$sets$cs[[cs_idx]]] <- 0
      # All weights zero: no valid perturbed prior remains.
      if (all(pw_cs == 0)) break
      # Step 1: fit with zeroed CS weights (no initialization)
      p1 <- params
      p1$prior_weights <- reconstruct_full_weights(pw_cs, model$null_weight)
      p1$null_weight <- model$null_weight
      p1$model_init <- NULL
      p1$verbose <- FALSE
      p1$track_fit <- FALSE
      p1$refine <- FALSE  # avoid recursive refinement of candidate fits
      m1 <- susie_workhorse(data, p1)
      # Step 2: re-fit with original weights, warm-started from Step 1
      init <- list(alpha = m1$alpha, mu = m1$mu, mu2 = m1$mu2)
      class(init) <- "susie"
      p2 <- params
      p2$prior_weights <- reconstruct_full_weights(pw_s, model$null_weight)
      p2$null_weight <- model$null_weight
      p2$model_init <- init
      p2$verbose <- FALSE
      p2$track_fit <- FALSE
      p2$refine <- FALSE
      candidates <- c(candidates, list(susie_workhorse(data, p2)))
    }
    if (length(candidates) == 0)
      return(list(model = model, converged = TRUE))
    elbos <- sapply(candidates, susie_get_objective)
    current_elbo <- susie_get_objective(model)
    if (max(elbos) - current_elbo > params$tol) {
      # Accept best candidate
      list(model = candidates[[which.max(elbos)]])
    } else {
      # No improvement beyond tolerance -- converged
      list(model = model, converged = TRUE)
    }
  }

  block_coordinate_ascent(model, data, cs_refine_step, max_iter = 100,
                          tol = params$tol, verbose = params$verbose)
}

================================================
FILE: R/rss_lambda_methods.R
================================================

#
# =============================================================================
# OMEGA OPTIMIZATION TOLERANCES
#
# Named constants for multi-panel mixture weight optimization.
# Collected here to avoid scattered magic numbers.
# =============================================================================
.omega_tol <- list(
  convergence = 1e-3,   # max|delta omega| to skip future updates
  grid_spacing = 0.25,  # K=2 warm-start grid resolution
  fw_stop = 1e-6,       # Frank-Wolfe improvement stopping criterion
  fw_max_iter = 5L      # Frank-Wolfe max iterations
)

# =============================================================================
# DATA INITIALIZATION & CONFIGURATION
#
# Functions for data object setup, configuration, and preprocessing.
# These prepare data objects for model fitting and handle data-specific
# configurations like unmappable effects.
#
# Functions: configure_data, get_var_y
# =============================================================================

# Configure data (rss_lambda reuses the default configuration unchanged)
#' @keywords internal
configure_data.rss_lambda <- function(data, params) {
  return(configure_data.default(data, params))
}

# Get variance of y; z-scores are on a standardized scale, so var(y) = 1.
#' @keywords internal
get_var_y.rss_lambda <- function(data, ...) {
  return(1)
}

# =============================================================================
# MODEL INITIALIZATION & SETUP
#
# Functions for initializing model objects and setting up initial states.
# These create model matrices, initialize fitted values, and prepare
# the SuSiE model for iterative fitting.
#
# Functions: initialize_susie_model, initialize_fitted, validate_prior, track_ibss_fit
# =============================================================================

# Initialize SuSiE model
#' @keywords internal
initialize_susie_model.rss_lambda <- function(data, params, var_y, ...)
{
  # Base model
  model <- initialize_matrices(data, params, var_y)
  # Initialize SinvRj and RjSinvRj: columns of S^{-1}R and the diagonal of
  # R S^{-1} R, computed through the eigendecomposition R = V D V'.
  eigen_R <- get_eigen_R(data, model)
  D <- eigen_R$values
  V <- eigen_R$vectors
  Vt <- t(V)
  Dinv <- compute_Dinv(model, data)
  model$SinvRj <- V %*% (Dinv * D * Vt)
  model$RjSinvRj <- colSums(Vt * (Dinv * D^2 * Vt))
  return(model)
}

# Initialize fitted values.
#' @keywords internal
initialize_fitted.rss_lambda <- function(data, mat_init) {
  # Rz = R %*% (overall posterior mean) on the z-score scale.
  return(list(Rz = as.vector(compute_Rv(data, colSums(mat_init$alpha * mat_init$mu)))))
}

# Validate prior variance (default behavior applies unchanged)
#' @keywords internal
validate_prior.rss_lambda <- function(data, params, model, ...) {
  return(validate_prior.default(data, params, model, ...))
}

# Track core parameters for tracking (default behavior applies unchanged)
#' @keywords internal
track_ibss_fit.rss_lambda <- function(data, params, model, tracking, iter, elbo, ...) {
  return(track_ibss_fit.default(data, params, model, tracking, iter, elbo, ...))
}

# =============================================================================
# SINGLE EFFECT REGRESSION & ELBO
#
# Core functions for single effect regression computation and ELBO calculation.
# These handle the mathematical core of SuSiE including residual computation, SER
# statistics, posterior moments, and log-likelihood calculations for the ELBO.
#
# Functions: compute_residuals, compute_ser_statistics, SER_posterior_e_loglik,
#            calculate_posterior_moments, compute_kl, get_ER2, Eloglik, loglik, neg_loglik
# =============================================================================

# Compute residuals for single effect regression
#' @keywords internal
compute_residuals.rss_lambda <- function(data, params, model, l, ...)
{
  # Remove lth effect from fitted values (scaled by slot weight)
  sw_l <- get_slot_weight(model, l)
  Rz_without_l <- model$Rz - sw_l * compute_Rv(data, model$alpha[l, ] * model$mu[l, ])
  # Store unified residuals in model
  model$residuals <- data$z - Rz_without_l
  model$fitted_without_l <- Rz_without_l
  model$residual_variance <- 1 # RSS lambda uses normalized residual variance
  return(model)
}

# Compute SER statistics
#' @keywords internal
compute_ser_statistics.rss_lambda <- function(data, params, model, l, ...) {
  # betahat_j = (S^{-1}R)_j' r / (R S^{-1} R)_jj, shat2_j its variance.
  signal <- as.vector(crossprod(model$SinvRj, model$residuals))
  shat2 <- 1 / model$RjSinvRj
  betahat <- signal * shat2
  # Optimization parameters: warm-start V at the moment estimate
  # max(betahat^2 - shat2), floored at 1e-6; optimize log(V) in [-30, 15].
  optim_init <- log(max(c(betahat^2 - shat2, 1e-6), na.rm = TRUE))
  optim_bounds <- c(-30, 15)
  optim_scale <- "log"
  return(list(
    betahat = betahat,
    shat2 = shat2,
    optim_init = optim_init,
    optim_bounds = optim_bounds,
    optim_scale = optim_scale
  ))
}

# SER posterior expected log-likelihood
#' @keywords internal
SER_posterior_e_loglik.rss_lambda <- function(data, params, model, l) {
  # First and second posterior moments of the lth effect.
  Eb <- model$alpha[l, ] * model$mu[l, ]
  Eb2 <- model$alpha[l, ] * model$mu2[l, ]
  eigen_R <- get_eigen_R(data, model)
  V <- eigen_R$vectors
  Dinv <- compute_Dinv(model, data)
  rR <- compute_Rv(data, model$residuals)
  SinvEb <- V %*% (Dinv * crossprod(V, Eb))
  # -0.5 * E[-2 r'R S^{-1} b + b' R S^{-1} R b] up to constants.
  return(-0.5 * (-2 * sum(rR * SinvEb) + sum(model$RjSinvRj * Eb2)))
}

# Calculate posterior moments for single effect regression
#' @keywords internal
calculate_posterior_moments.rss_lambda <- function(data, params, model, V, l, ...)
{
  # Conjugate normal update: post_var = V*shat2/(V+shat2),
  # post_mean = (post_var/shat2) * betahat.
  shat2 <- 1 / model$RjSinvRj
  post_var <- V * shat2 / (V + shat2)
  signal <- as.vector(crossprod(model$SinvRj, model$residuals))
  betahat <- signal * (1 / model$RjSinvRj)
  post_mean <- post_var / shat2 * betahat
  post_mean2 <- post_var + post_mean^2
  # Store posterior moments in model
  model$mu[l, ] <- post_mean
  model$mu2[l, ] <- post_mean2
  return(model)
}

# Calculate KL divergence (default behavior applies unchanged)
#' @keywords internal
compute_kl.rss_lambda <- function(data, params, model, l) {
  model <- compute_kl.default(data, params, model, l)
  return(model)
}

# Expected squared residuals
#' @keywords internal
get_ER2.rss_lambda <- function(data, model) {
  # Eigen decomposition components
  eigen_R <- get_eigen_R(data, model)
  D <- eigen_R$values
  V <- eigen_R$vectors
  Dinv <- compute_Dinv(model, data)
  # Cached quantities
  Vtz <- get_Vtz(data, model)
  zbar <- model$zbar
  postb2 <- model$diag_postb2
  # z^T S^{-1} z (use model z_null_norm2 if omega changed, else data)
  # When lambda=0, null-space components are projected out (ignored).
  z_null_norm2 <- if (!is.null(model$z_null_norm2)) model$z_null_norm2 else data$z_null_norm2
  zSinvz <- sum((Dinv * Vtz) * Vtz)
  if (data$lambda > 0) zSinvz <- zSinvz + z_null_norm2 / data$lambda
  # -2 zbar^T S^{-1} z
  tmp <- V %*% (Dinv * (D * Vtz))
  term2 <- -2 * sum(tmp * zbar)
  # zbar^T R S^{-1} R zbar
  Vtzbar <- crossprod(V, zbar)
  term3 <- sum((Vtzbar^2) * (Dinv * D^2))
  # RZ2 = sum((Z %*% RSinvR) * Z)
  VtZ <- model$Z %*% V
  term4 <- sum((VtZ^2) %*% (Dinv * D^2))
  # diag(RSinvR)^T postb2
  diag_RSinvR <- rowSums((V^2) * rep(Dinv * D^2, each = nrow(V)))
  term5 <- sum(diag_RSinvR * postb2)
  return(zSinvz + term2 + term3 - term4 + term5)
}

# Expected log-likelihood
#' @keywords internal
Eloglik.rss_lambda <- function(data, model) {
  D <- get_eigen_R(data, model)$values
  d <- model$sigma2 * D + data$lambda
  # When lambda=0, zero eigenvalues give d=0; project out null-space.
  d_pos <- d[d > 0]
  r_eff <- length(d_pos)
  return(-(r_eff / 2) * log(2 * pi) - 0.5 * sum(log(d_pos)) -
           0.5 * get_ER2.rss_lambda(data, model))
}

# Log-likelihood for RSS
#' @keywords internal
loglik.rss_lambda <- function(data, params, model, V, ser_stats, l = NULL, ...) {
  # Wakefield ABF using betahat/shat2 from ser_stats (supports inflation)
  shat2 <- pmax(ser_stats$shat2, .Machine$double.eps)
  lbf <- -0.5 * log(1 + V / shat2) +
    0.5 * ser_stats$betahat^2 * V / (shat2 * (V + shat2))
  # Stabilize logged Bayes Factor
  stable_res <- lbf_stabilization(lbf, model$pi, ser_stats$shat2)
  # Compute posterior weights
  weights_res <- compute_posterior_weights(stable_res$lpo)
  # Store in model if l is provided, otherwise return lbf_model for prior variance optimization
  if (!is.null(l)) {
    model$alpha[l, ] <- weights_res$alpha
    model$lbf[l] <- weights_res$lbf_model
    model$lbf_variable[l, ] <- stable_res$lbf
    return(model)
  } else {
    return(weights_res$lbf_model)
  }
}

#' @keywords internal
neg_loglik.rss_lambda <- function(data, params, model, V_param, ser_stats, ...) {
  # Convert parameter to V based on optimization scale (always log for RSS lambda)
  V <- exp(V_param)
  lbf_model <- loglik.rss_lambda(data, params, model, V, ser_stats)
  return(-lbf_model)
}

# =============================================================================
# MODEL UPDATES & FITTING
#
# Functions for iterative model updates and variance component estimation.
# These handle the dynamic aspects of model fitting including fitted value
# updates and variance component estimation.
#
# Functions: update_fitted_values, update_variance_components, update_derived_quantities
# =============================================================================

# Update fitted values
#' @keywords internal
update_fitted_values.rss_lambda <- function(data, params, model, l, ...)
{
  # Add back lth effect (scaled by slot weight)
  sw_l <- get_slot_weight(model, l)
  model$Rz <- model$fitted_without_l +
    sw_l * as.vector(compute_Rv(data, model$alpha[l, ] * model$mu[l, ]))
  model <- precompute_rss_lambda_terms(data, model)
  return(model)
}

# Update model variance
#' @keywords internal
update_model_variance.rss_lambda <- function(data, params, model) {
  if (!isTRUE(params$estimate_residual_variance)) return(model)
  variance_result <- update_variance_components(data, params, model)
  model <- modifyList(model, variance_result)
  # Clamp sigma2 to user-supplied bounds before refreshing derived terms.
  model$sigma2 <- min(max(model$sigma2, params$residual_variance_lowerbound),
                      params$residual_variance_upperbound)
  model <- update_derived_quantities(data, params, model)
  return(model)
}

# Update variance components
#' @keywords internal
#' @importFrom stats optimize
update_variance_components.rss_lambda <- function(data, params, model, ...) {
  if (!isTRUE(params$estimate_residual_variance)) return(list())
  # sigma2 + lambda <= 1 on the z-score scale, hence this upper bound.
  upper_bound <- 1 - data$lambda
  objective <- function(sigma2) {
    temp_model <- model
    temp_model$sigma2 <- sigma2
    Eloglik.rss_lambda(data, temp_model)
  }
  est_sigma2 <- optimize(objective, interval = c(1e-4, upper_bound), maximum = TRUE)$maximum
  # Brent can miss a boundary maximum; prefer the boundary when it is better.
  if (objective(est_sigma2) < objective(upper_bound)) est_sigma2 <- upper_bound
  list(sigma2 = est_sigma2)
}

# Update derived quantities
#' @keywords internal
update_derived_quantities.rss_lambda <- function(data, params, model) {
  eigen_R <- get_eigen_R(data, model)
  Dinv <- compute_Dinv(model, data)
  V <- eigen_R$vectors
  D <- eigen_R$values
  Vt <- t(V)
  # Update SinvRj and RjSinvRj (Dinv depends on sigma2, so these must be
  # recomputed after every residual-variance update).
  model$SinvRj <- V %*% (Dinv * D * Vt)
  model$RjSinvRj <- colSums(Vt * (Dinv * (D^2) * Vt))
  return(model)
}

# =============================================================================
# OUTPUT GENERATION & POST-PROCESSING
#
# Functions for generating final results and summary statistics.
# These process fitted models into interpretable outputs including
# credible sets, variable names, and fitted values.
#
# Functions: get_scale_factors, get_intercept, get_fitted, get_cs,
#            get_variable_names, get_zscore
# =============================================================================

# Get scale factors; z-scores are already standardized, so all ones.
#' @keywords internal
get_scale_factors.rss_lambda <- function(data, params) {
  return(rep(1, data$p))
}

# Get intercept
#' @keywords internal
get_intercept.rss_lambda <- function(data, params, model, ...) {
  return(data$intercept_value)
}

# Get fitted values (default behavior applies unchanged)
#' @keywords internal
get_fitted.rss_lambda <- function(data, params, model, ...) {
  return(get_fitted.default(data, params, model, ...))
}

# Get credible sets
#' @keywords internal
get_cs.rss_lambda <- function(data, params, model, ...) {
  # CS computation is skipped entirely when either knob is NULL.
  if (is.null(params$coverage) || is.null(params$min_abs_corr)) {
    return(NULL)
  }
  # Prefer the raw genotype-like matrix X for purity; otherwise use the
  # correlation form of R (symmetry already guaranteed upstream).
  if (!is.null(data$X)) {
    return(susie_get_cs(model, X = data$X, coverage = params$coverage,
                        min_abs_corr = params$min_abs_corr,
                        n_purity = params$n_purity))
  }
  return(susie_get_cs(model, Xcorr = safe_cov2cor(data$R),
                      check_symmetric = FALSE, coverage = params$coverage,
                      min_abs_corr = params$min_abs_corr,
                      n_purity = params$n_purity))
}

# Get variable names (taken from the names of the z-score vector)
#' @keywords internal
get_variable_names.rss_lambda <- function(data, model, ...) {
  return(assign_names(data, model, names(data$z)))
}

# Get univariate z-scores (default behavior applies unchanged)
#' @keywords internal
get_zscore.rss_lambda <- function(data, params, model, ...) {
  return(get_zscore.default(data, params, model))
}

# Clean up model object for RSS lambda data
#' @keywords internal
cleanup_model.rss_lambda <- function(data, params, model, ...) {
  # Remove common fields
  model <- cleanup_model.default(data, params, model, ...)
  # Remove RSS-lambda-specific temporary fields
  rss_fields <- c("SinvRj", "RjSinvRj", "Rz", "Z", "zbar", "diag_postb2",
                  "eigen_R", "Vtz", "z_null_norm2", "residuals",
                  "fitted_without_l", "residual_variance")
  for (field in rss_fields) {
    if (field %in% names(model)) {
      model[[field]] <- NULL
    }
  }
  return(model)
}



================================================
FILE: R/rss_mismatch.R
================================================
# RSS R-reference mismatch handling.
#
# Single home for code that targets the discrepancy between the
# supplied R reference and the target population. Active on the SS
# / ss_mixture dispatches; the rss_lambda dispatch (lambda > 0) does
# NOT use any of this (entry-level errors block lambda > 0 with
# R_finite or R_mismatch != "none").
#
# * 1-D MAP optimizer for the variance component lambda_bias
#   (estimate_lambda_bias)
# * per-variable inflation factor used inside the SER step
#   (compute_shat2_inflation)
# * model-state storage helper for per-slot inflation diagnostics
#   (apply_inflation_state)
# * per-sweep region-level fit (fit_R_mismatch)
# * residual R-mismatch QC diagnostic Q_art (R_mismatch = "map_qc")
#
# Storage convention on the model:
#   model$lambda_bias      scalar set once per sweep by fit_R_mismatch
#   model$B_corrected      1 / (1/B + lambda_bias)
#   model$shat2_inflation  per-variable inflation vector of length p,
#                          consumed by the SER step.

# =============================================================================
# FINITE-REFERENCE SETUP AND DIAGNOSTICS
# =============================================================================

# Resolve R_finite into an explicit reference sample size B.
# R_finite = TRUE is only meaningful when the reference factor X is available;
# for precomputed R, the caller must provide B explicitly.
#' @keywords internal
resolve_R_finite <- function(R_finite, X = NULL, is_multi_panel = FALSE) {
  # Disabled: no finite-reference correction requested.
  if (is.null(R_finite))
    return(NULL)

  # R_finite = TRUE: derive B from the reference factor X itself.
  if (isTRUE(R_finite)) {
    if (is.null(X))
      stop("R_finite = TRUE requires X input. ",
           "When using a precomputed R matrix, provide a positive number ",
           "specifying the reference sample size B instead.")
    panel_sizes <- if (is_multi_panel) vapply(X, nrow, integer(1)) else nrow(X)
    return(min(panel_sizes))
  }

  # Everything else must be strictly positive, finite, numeric.
  bad_numeric <- !is.numeric(R_finite) || any(!is.finite(R_finite)) ||
    any(R_finite <= 0)
  if (bad_numeric)
    stop("R_finite must be NULL, TRUE, or positive numeric value(s).")

  if (is_multi_panel) {
    # Recycle a scalar across K panels; otherwise require one value per panel.
    n_panels <- if (is.null(X)) length(R_finite) else length(X)
    if (length(R_finite) == 1)
      return(rep(as.numeric(R_finite), n_panels))
    if (length(R_finite) == n_panels)
      return(as.numeric(R_finite))
    stop("For multi-panel input, R_finite must be TRUE, a single positive ",
         "number, or one positive number per panel.")
  }

  # Single-panel: exactly one positive number is accepted.
  if (length(R_finite) == 1)
    return(as.numeric(R_finite))
  stop("R_finite must be NULL, TRUE, or a single positive number.")
}

# Compute finite-reference R diagnostics (debiased Frobenius norm,
# effective rank, r/B ratio, per-variant diagonal deviation from 1).
# Used by both summary_stats_constructor and rss_lambda_constructor.
#
# @param X Factor matrix (B x p), or NULL.
# @param R Precomputed R matrix (p x p), or NULL.
# @param B Reference panel sample size.
# @param p Number of variants.
# @param x_is_standardized If TRUE, X has been standardized so X'X = R_hat
#   directly (no normalization). If FALSE, R_hat = X'X/B so the Frobenius
#   norm needs a /B^2 correction.
# @return List with B, p, R_frob_sq_debiased, effective_rank, r_over_B,
#   Rhat_diag_deviation.
#' @keywords internal
compute_R_finite_diagnostics <- function(X = NULL, R = NULL, B, p,
                                         x_is_standardized = FALSE) {
  # Squared Frobenius norm of R_hat and its diagonal, from whichever
  # representation is available: X preferred, then R, else the identity.
  if (!is.null(X)) {
    gram <- tcrossprod(X)  # B x B Gram matrix; ||XX'||_F^2 = ||X'X||_F^2
    frob_sq <- sum(gram^2)
    diag_hat <- colSums(X^2)
    if (!x_is_standardized) {
      # R_hat = X'X / B: rescale both the norm and the diagonal.
      frob_sq <- frob_sq / nrow(X)^2
      diag_hat <- diag_hat / nrow(X)
    }
  } else if (!is.null(R)) {
    frob_sq <- sum(R^2)
    diag_hat <- diag(R)
  } else {
    # No reference supplied: identity fallback.
    frob_sq <- p
    diag_hat <- rep(1, p)
  }

  # Debiased Frobenius norm (Ledoit-Wolf unbiased estimator), floored at 1
  # in the denominator so effective rank stays finite.
  frob_sq_debiased <- (B * frob_sq - p^2) / (B + 1)
  rank_eff <- p^2 / max(frob_sq_debiased, 1)

  list(B = B,
       p = p,
       R_frob_sq_debiased = frob_sq_debiased,
       effective_rank = rank_eff,
       r_over_B = rank_eff / B,
       Rhat_diag_deviation = abs(diag_hat - 1))
}

# =============================================================================
# 1-D MAP OPTIMIZER FOR lambda_bias
# =============================================================================

# Estimate extra R-bias variance beyond finite-reference uncertainty.
# Likelihood on the z-score residual scale,
#   tau_j^2 = sigma2 + (1/R_finite_B + lambda_bias) * s_j,
# with a half-Cauchy(prior_scale) prior on u = sqrt(lambda_bias).
# The Fisher-information boundary SE,
#   SE_0 = sqrt(2) * sigma2 / sqrt(sum(s^2)),
# defines a data-driven floor: estimates below 0.1 * SE_0 are zeroed.
# This both suppresses Brent boundary noise and replaces ad-hoc display
# thresholds with one rule; "none" short-circuits before optimization.
#' @keywords internal
estimate_lambda_bias <- function(r, s, sigma2, R_finite_B, method) {
  # "none" (or no method at all) short-circuits before any optimization.
  if (is.null(method) || method == "none")
    return(0)

  ok <- is.finite(r) & is.finite(s) & s > .Machine$double.eps
  if (!any(ok) || !is.finite(sigma2) || sigma2 <= .Machine$double.eps)
    return(0)

  r2 <- r[ok]^2
  sv <- s[ok]
  base_var <- sigma2 + sv / R_finite_B

  # Method-of-moments excess variances; used only to size the search interval.
  excess <- (r2 - base_var) / sv
  excess <- excess[is.finite(excess) & excess > 0]

  # Half-Cauchy prior scale on u = sqrt(lambda_bias).
  prior_scale <- sqrt(max(1 / R_finite_B, 1e-4))
  lambda_cap <- max(c(1, 100 / R_finite_B, 100 * prior_scale^2, 10 * excess),
                    na.rm = TRUE)

  # Negative log-posterior in u; tau_j = base_var_j + u^2 * s_j.
  neg_log_post <- function(u) {
    tau <- base_var + u^2 * sv
    0.5 * sum(log(tau) + r2 / tau) + log1p((u / prior_scale)^2)
  }
  lambda_hat <- optimize(neg_log_post, interval = c(0, sqrt(lambda_cap)))$minimum^2

  # Fisher-information boundary SE defines the zero-mask floor.
  s_norm_sq <- sum(sv^2)
  if (s_norm_sq <= 0)
    return(0)
  se_floor <- sqrt(2) * sigma2 / sqrt(s_norm_sq)
  if (lambda_hat < 0.1 * se_floor) 0 else lambda_hat
}

# =============================================================================
# PER-VARIABLE INFLATION
# =============================================================================

# SS-path per-variable inflation factor tau_j^2 / sigma2 with
#   tau_j^2 = sigma2 + (1/R_finite_B + lambda_bias) * (eta_j^2 + v_g),
#   eta_j^2 = XtXr_without_l[j]^2 / (n-1)  (z-score scale)
#   v_g = sum(b_minus_l * XtXr_without_l).
# Reads the region-level scalar lambda_bias from model (set once per
# sweep by fit_R_mismatch). Per-slot lambda_bias re-fitting was removed:
# the previous design re-estimated lambda_bias inside every SER step
# from the leave-one-effect residual, which intentionally contains the
# lth sparse signal and so confounded signal with R-bias. The fix is
# the per-sweep fit_R_mismatch hook in ibss_fit; this function only
# applies the scalar to the slot-specific xi_l.
# Returns NULL when no inflation applies, otherwise a list with the
# inflation vector and lambda_bias / B_corrected = NULL so that
# apply_inflation_state does not write per-slot diagnostics on the SS
# path (those are scalars on the model, set by fit_R_mismatch).
#' @keywords internal
compute_shat2_inflation <- function(data, model, XtXr_without_l, b_minus_l, r) {
  # Model-level B takes precedence over the data-level B when present.
  B_ref <- model$R_finite_B
  if (is.null(B_ref))
    B_ref <- data$R_finite_B

  # No finite-reference B, or degenerate sigma2: no inflation applies.
  if (is.null(B_ref) || model$sigma2 <= .Machine$double.eps)
    return(NULL)

  # xi_l = eta^2 + v_g on the z-score scale; v_g is clipped at zero.
  genetic_var <- max(sum(b_minus_l * XtXr_without_l), 0)
  eta_sq <- XtXr_without_l^2 / (data$n - 1)
  xi <- eta_sq + genetic_var

  # Region-level scalar set per sweep by fit_R_mismatch; 0 when unset.
  bias <- model$lambda_bias
  if (is.null(bias))
    bias <- 0

  list(infl = 1 + (1 / B_ref + bias) * xi / model$sigma2,
       lambda_bias = NULL,
       B_corrected = NULL)
}

# =============================================================================
# MODEL-STATE STORAGE FOR PER-SLOT INFLATION DIAGNOSTICS
# =============================================================================

# Unpack the inflation list from compute_shat2_inflation into the model.
# Sets model$shat2_inflation to the per-variant inflation vector. The
# per-slot writes to model$lambda_bias[l] / model$B_corrected[l] gated
# below are dormant in the current code: SS / ss_mixture callers always
# pass infl_state$lambda_bias = NULL (the scalar lambda_bias is set
# once per sweep by fit_R_mismatch), and the rss_lambda path no longer
# calls this function. The per-slot machinery is retained as inert
# back-compat shim and will be removed when the next constructor pass
# converges on a single storage shape.
#' @keywords internal
apply_inflation_state <- function(model, infl_state, l) {
  # No inflation state: clear any stale inflation vector and return.
  if (is.null(infl_state)) {
    model$shat2_inflation <- NULL
    return(model)
  }

  model$shat2_inflation <- infl_state$infl
  n_effects <- nrow(model$alpha)

  # Dormant per-slot diagnostics: only written when the caller supplies
  # non-NULL scalars (current SS / ss_mixture callers never do).
  if (!is.null(infl_state$lambda_bias)) {
    if (is.null(model$lambda_bias) || length(model$lambda_bias) != n_effects)
      model$lambda_bias <- rep(0, n_effects)
    model$lambda_bias[l] <- infl_state$lambda_bias
  }
  if (!is.null(infl_state$B_corrected)) {
    if (is.null(model$B_corrected) || length(model$B_corrected) != n_effects)
      model$B_corrected <- rep(NA_real_, n_effects)
    model$B_corrected[l] <- infl_state$B_corrected
  }

  model
}

# =============================================================================
# PER-SWEEP REGION-LEVEL fit_R_mismatch
# =============================================================================

#' Fit the region-level lambda_bias from the post-sweep fitted residual.
#'
#' Math (see archive/ld_mismatch_generativemodel.tex):
#'   beta_bar = colSums(slot_weight * alpha * mu) (full posterior mean, betahat scale)
#'   XtXr_full = X'X * beta_bar = (n-1) * R * beta_bar
#'   r_fit = (data$Xty - XtXr_full) / sqrt(n-1) (z-scale fitted residual)
#'   eta_fit_j^2 = XtXr_full[j]^2 / (n-1) (z-scale per-variant signal)
#'   v_g_fit = sum(beta_bar * XtXr_full) (= beta_bar_z' R beta_bar_z)
#'   xi_fit_j = eta_fit_j^2 + v_g_fit
#' MAP for lambda_bias on the working likelihood
#'   r_fit_j ~ N(0, sigma2 + (1/B + lambda) * xi_fit_j)
#' with half-Cauchy(scale = sqrt(max(1/B, 1e-4))) prior on sqrt(lambda).
#' Fisher SE zero-mask applied (see estimate_lambda_bias).
#'
#' Replaces the per-slot re-fit that used to live inside
#' compute_shat2_inflation, which estimated lambda_bias from the
#' intra-sweep r_full_z that drifts as the slot loop progresses.
#'
#' For mode = "map_qc" the same lambda_bias fit is followed by the
#' Q_art residual artifact diagnostic; see compute_Q_art. The
#' artifact diagnostic emits an R warning when flagged; it does
#' not change lambda_bias or the SER likelihood.
#'
#' @keywords internal
#' @noRd
fit_R_mismatch <- function(data, params, model) {
  R_mismatch <- if (!is.null(params$R_mismatch)) params$R_mismatch else "none"
  if (R_mismatch == "none") return(model)
  # A finite-reference B and a usable sigma2 are prerequisites for the fit.
  R_finite_B <- if (!is.null(model$R_finite_B)) model$R_finite_B else data$R_finite_B
  if (is.null(R_finite_B) || !is.finite(model$sigma2) ||
      model$sigma2 <= .Machine$double.eps) return(model)
  # Only active on the SS / ss_mixture dispatches (see file header).
  if (!inherits(data, c("ss", "ss_mixture"))) return(model)
  # Full posterior mean across all effect slots (betahat scale).
  sw <- if (!is.null(model$slot_weights)) model$slot_weights else rep(1, nrow(model$alpha))
  b_full <- colSums(sw * model$alpha * model$mu)
  XtXr_full <- if (!is.null(model$XtXr)) model$XtXr else compute_Rv(data, b_full)
  nm1 <- if (!is.null(data$nm1)) data$nm1 else (data$n - 1)
  if (!is.finite(nm1) || nm1 <= 0) return(model)
  # z-scale fitted residual and per-variant signal scale (see roxygen above).
  r_fit_z <- (data$Xty - XtXr_full) / sqrt(nm1)
  v_g_full <- max(sum(b_full * XtXr_full), 0)
  s_full <- XtXr_full^2 / nm1 + v_g_full
  model$lambda_bias <- estimate_lambda_bias(r_fit_z, s_full, model$sigma2,
                                            R_finite_B, R_mismatch)
  model$B_corrected <- 1 / (1 / R_finite_B + model$lambda_bias)
  if (R_mismatch == "map_qc") {
    eigen_R <- get_R_mismatch_eigen(data, model)
    if (is.null(eigen_R))
      stop("R_mismatch = 'map_qc' requires data$eigen_R; ",
           "summary_stats_constructor should have cached it.")
    eig_delta_rel <- if (!is.null(params$eig_delta_rel)) params$eig_delta_rel else 1e-3
    eig_delta_abs <- if (!is.null(params$eig_delta_abs)) params$eig_delta_abs else 0
    art <- compute_Q_art(eigen_R, r_fit_z, eig_delta_rel, eig_delta_abs)
    threshold <- if (!is.null(params$artifact_threshold)) params$artifact_threshold else 0.1
    flagged <- isTRUE(art$evaluable) && isTRUE(art$Q_art > threshold)
    # Record diagnostics on the model regardless of the flag outcome.
    model$Q_art <- art$Q_art
    model$artifact_evaluable <- art$evaluable
    model$artifact_flag <- flagged
    model$low_eigen_count <- art$low_eigen_count
    model$low_eigen_fraction <- art$low_eigen_count / length(eigen_R$values)
    model$eig_delta <- art$eig_delta
    if (flagged) {
      msg <- paste0("Residual R-bias artifact detected (Q_art = ",
                    sprintf("%.3g", art$Q_art), " > threshold ",
                    sprintf("%.3g", threshold),
                    "). Fine-mapping results may be unreliable with ",
                    "this R reference. Consider allele/QC review, ",
                    "multi-reference analysis, or conservative fallback.")
      model$mode_label <- "warning"
      # NOTE(review): the message is emitted twice -- once via the package
      # helper warning_message() and once via base warning(); confirm the
      # duplication is intentional.
      warning_message(msg)
      warning(msg, call. = FALSE)
    } else {
      model$mode_label <- "normal"
    }
  }
  model
}

# Eigen accessor for map_qc. The ordinary SS path stores data$eigen_R.
# The ss_mixture path can change R through omega, so recover the current
# mixture spectrum from panel_R when omega is available; otherwise fall
# back to the initialized X_meta crossproduct.
#' @keywords internal
get_R_mismatch_eigen <- function(data, model) {
  if (!is.null(model$eigen_R)) return(model$eigen_R)
  if (!is.null(data$eigen_R) && !inherits(data, "ss_mixture")) return(data$eigen_R)
  if (inherits(data, "ss_mixture")) {
    # Preferred: reduced-form eigen reconstruction from the omega cache.
    if (!is.null(model$omega) && !is.null(data$omega_cache)) {
      eig <- eigen_from_reduced(data$omega_cache, model$omega, data$K, data$p)
      eig$values <- pmax(eig$values, 0)  # clip tiny negative eigenvalues
      return(eig)
    }
    # Fallback: form the omega-weighted mixture R and eigendecompose it.
    if (!is.null(model$omega) && !is.null(data$panel_R)) {
      R_mix <- Reduce("+", Map(function(w, R) w * R, model$omega, data$panel_R))
      R_mix <- 0.5 * (R_mix + t(R_mix))  # symmetrize against numeric drift
      eig <- eigen(R_mix, symmetric = TRUE)
      eig$values <- pmax(eig$values, 0)
      return(eig)
    }
    # Last resort: crossproduct of the initialized meta X.
    if (!is.null(data$X)) {
      R_init <- crossprod(data$X) / data$nm1
      R_init <- 0.5 * (R_init + t(R_init))
      eig <- eigen(R_init, symmetric = TRUE)
      eig$values <- pmax(eig$values, 0)
      return(eig)
    }
  }
  data$eigen_R
}

# =============================================================================
# Q_art residual R-bias artifact diagnostic
# =============================================================================

# Fraction of fitted-residual energy in low-eigenvalue directions of R.
# delta = max(eig_delta_abs, eig_delta_rel * max(d))
# A_delta = {k : d_k <= delta}
# Q_art = sum_{k in A_delta} (v_k' r_fit)^2 / sum(r_fit^2)
# When the fitted residual is well-explained by R, energy in
# low-eigenvalue directions is near the noise floor. A large Q_art
# flags residual structure that the supplied reference says should be
# weak or absent; allele/strand flips should still be checked by
# kriging-style diagnostics.
#
# Returns a list with Q_art (in [0, 1]), evaluable (FALSE when no
# low-eigenvalues exist or r_fit has negligible energy),
# low_eigen_count, eig_delta. Q_art is a heuristic proportion, not a
# calibrated test statistic; see archive/ld_mismatch_generativemodel.tex
# Sec. "Detecting residual R-bias artifacts".
#' @keywords internal
compute_Q_art <- function(eigen_R, r_fit, eig_delta_rel = 1e-3,
                          eig_delta_abs = 0, residual_energy_floor = 1e-12) {
  eigvals <- eigen_R$values
  eigvecs <- eigen_R$vectors

  # Low-eigenvalue set A_delta, thresholded relative to the spectrum's top.
  cutoff <- max(eig_delta_abs, eig_delta_rel * max(eigvals))
  low_idx <- which(eigvals <= cutoff)

  total_energy <- sum(r_fit^2)
  evaluable <- length(low_idx) > 0L && total_energy > residual_energy_floor
  if (!evaluable)
    return(list(Q_art = 0, evaluable = FALSE,
                low_eigen_count = length(low_idx), eig_delta = cutoff))

  # Fraction of residual energy landing in the low-eigenvalue subspace.
  coords <- as.numeric(crossprod(eigvecs[, low_idx, drop = FALSE], r_fit))
  list(Q_art = sum(coords^2) / total_energy,
       evaluable = TRUE,
       low_eigen_count = length(low_idx),
       eig_delta = cutoff)
}



================================================
FILE: R/single_effect_regression.R
================================================
# =============================================================================
# SINGLE EFFECT REGRESSION
#
# Performs single effect regression for the lth effect in the SuSiE model.
# Computes posterior moments, log Bayes factors, and optimizes prior variance.
# =============================================================================
#'
#' @param data Data object (individual, ss, or rss_lambda)
#' @param params Validated params object
#' @param model Current SuSiE model object
#' @param l Effect index being updated
#'
#' @return Updated model with alpha, mu, mu2, lbf, lbf_variable, V, and KL stored for the lth effect
#'
#' @keywords internal
#' @noRd
single_effect_regression <- function(data, params, model, l) {
  # Fixed mixture prior path: evaluate BFs on a pre-specified variance grid
  # with given mixture weights, bypassing scalar V optimization entirely.
  # Activated by estimate_prior_method = "fixed_mixture" with non-NULL
  # prior_variance_grid and mixture_weights in params.
  if (params$estimate_prior_method == "fixed_mixture") {
    ser_stats <- compute_ser_statistics(data, params, model, l)
    model <- loglik_mixture(data, params, model, ser_stats, l)
    model <- calculate_posterior_moments_mixture(data, params, model, l)
    model <- compute_kl(data, params, model, l)
    # Store effective V as posterior-weighted grid mean (for diagnostics)
    V_eff <- sum(params$mixture_weights * params$prior_variance_grid)
    model <- set_prior_variance_l(model, l, V_eff)
    return(model)
  }
  # Two S3 hook slots: pre/post loglik. Defaults dispatch on
  # `params$estimate_prior_method`; downstream classes override.
  V <- get_prior_variance_l(model, l)
  ser_stats <- compute_ser_statistics(data, params, model, l)
  out <- pre_loglik_prior_hook(data, params, model, ser_stats, l = l, V_init = V)
  V <- out$V
  model <- out$model
  model <- loglik(data, params, model, V, ser_stats, l)
  model <- calculate_posterior_moments(data, params, model, V, l)
  model <- compute_kl(data, params, model, l)
  out <- post_loglik_prior_hook(data, params, model, ser_stats, l = l, V_init = V)
  V <- out$V
  model <- out$model
  model <- set_prior_variance_l(model, l, V)
  model
}

#' Pre-loglik prior-update hook
#'
#' S3 generic, called between SER stats and `loglik`. Default
#' routes to `optimize_prior_variance` for `optim` / `uniroot` /
#' `simple`. Returns `list(V, model)`.
#'
#' @export
#' @keywords internal
pre_loglik_prior_hook <- function(data, params, model, ser_stats, l, V_init) {
  UseMethod("pre_loglik_prior_hook")
}

#' @export
#' @keywords internal
pre_loglik_prior_hook.default <- function(data, params, model, ser_stats, l, V_init) {
  # Methods that optimize V before the BF computation go through here;
  # all other methods (e.g. EM, none) leave V_init untouched.
  if (params$estimate_prior_method %in% c("optim", "uniroot", "simple")) {
    return(optimize_prior_variance(data, params, model, ser_stats, l = l, V_init = V_init))
  }
  list(V = V_init, model = model)
}

#' Post-loglik prior-update hook
#'
#' S3 generic, called after `loglik` / posterior moments / KL.
#' Default routes to `optimize_prior_variance` for `EM`. Returns
#' `list(V, model)`.
#'
#' @export
#' @keywords internal
post_loglik_prior_hook <- function(data, params, model, ser_stats, l, V_init) {
  UseMethod("post_loglik_prior_hook")
}

#' @export
#' @keywords internal
post_loglik_prior_hook.default <- function(data, params, model, ser_stats, l, V_init) {
  # EM needs the freshly computed posterior quantities, hence post-loglik.
  if (identical(params$estimate_prior_method, "EM")) {
    return(optimize_prior_variance(
      data, params, model, ser_stats, l = l,
      alpha = get_alpha_l(model, l),
      moments = get_posterior_moments_l(model, l),
      V_init = V_init))
  }
  list(V = V_init, model = model)
}

# =============================================================================
# PRIOR VARIANCE OPTIMIZATION
#
# Optimizes prior variance for single effects using different methods.
# Handles optim, EM, simple methods and null threshold checking.
# =============================================================================

#' Per-effect prior variance update (S3 generic)
#'
#' Dispatched on the data class so downstream packages with non-scalar
#' prior structures (e.g., mfsusieR's adaptive mixture-of-normals
#' prior, future cross-modality priors) can run a per-effect prior
#' update step here while reusing the surrounding SER scaffolding.
#'
#' The default path implements the standard susieR scalar-V
#' optimization (`optim` Brent / `uniroot` / `EM` / `simple` /
#' `none`) plus the post-optimization null-threshold check.
#'
#' @param data Data object (e.g., `individual`, `ss`, `rss_lambda`,
#'   or a downstream class such as `mv_individual`, `mf_individual`).
#' @param params Validated params object.
#' @param model Current SuSiE model object.
#' @param ser_stats SER statistics and optimization parameters from
#'   `compute_ser_statistics`.
#' @param l Index of the effect being updated. Used by downstream
#'   methods that need per-effect state (e.g., the EM mixture-weight
#'   path); the default method uses it only for diagnostic purposes.
#' @param alpha Per-SNP posterior weights for effect `l`, supplied by
#'   the EM path (`get_alpha_l(model, l)`); `NULL` on the pre-loglik
#'   call.
#' @param moments Posterior moments for effect `l`, supplied by the
#'   EM path (`get_posterior_moments_l(model, l)`); `NULL` on the
#'   pre-loglik call.
#' @param V_init Initial value for the prior variance scalar.
#'
#' @return A named list with two elements:
#' \describe{
#'   \item{`V`}{numeric scalar, the optimized prior variance for
#'     effect `l`.}
#'   \item{`model`}{the (possibly mutated) model object. The default
#'     method leaves `model` unchanged; downstream methods may write
#'     prior-state updates here (e.g., mixture-weight vectors).}
#' }
#'
#' @keywords internal
#' @noRd
optimize_prior_variance <- function(data, params, model, ser_stats, l = NULL,
                                    alpha = NULL, moments = NULL, V_init = NULL) {
  UseMethod("optimize_prior_variance")
}

#' Default scalar-V prior-variance optimization
#'
#' Backbone implementation of `optimize_prior_variance`. Handles the
#' five `params$estimate_prior_method` cases (`optim`, `uniroot`,
#' `EM`, `simple`, `none`) on a scalar prior variance and runs the
#' post-optimization null-threshold check.
#' #' @inheritParams optimize_prior_variance #' @return A named list `list(V = ..., model = model)` (see #' `optimize_prior_variance` for the full contract). `model` is #' returned unchanged by this default method. #' @keywords internal #' @noRd optimize_prior_variance.default <- function(data, params, model, ser_stats, l = NULL, alpha = NULL, moments = NULL, V_init = NULL) { V <- V_init if (params$estimate_prior_method != "simple") { if (params$estimate_prior_method == "optim") { V_param_opt <- optim( par = ser_stats$optim_init, fn = function(V_param) neg_loglik(data, params, model, V_param, ser_stats), method = "Brent", lower = ser_stats$optim_bounds[1], upper = ser_stats$optim_bounds[2] )$par # Convert optimized parameter to V based on scale of optimization V_new <- if (ser_stats$optim_scale == "linear") { V_param_opt } else { exp(V_param_opt) } # Check if new estimate improves likelihood V_param_init <- if (ser_stats$optim_scale == "linear") V else log(V) if (neg_loglik(data, params, model, V_param_opt, ser_stats) > neg_loglik(data, params, model, V_param_init, ser_stats)) { V_new <- V } V <- V_new } else if (params$estimate_prior_method == "uniroot") { # Root-finding on the gradient of neg_loglik (on the optimization scale) neg_loglik_fn <- function(V_param) neg_loglik(data, params, model, V_param, ser_stats) neg_loglik_grad <- function(V_param) { h <- max(abs(V_param) * 1e-4, 1e-8) (neg_loglik_fn(V_param + h) - neg_loglik_fn(V_param - h)) / (2 * h) } V_root <- tryCatch( uniroot(neg_loglik_grad, interval = c(ser_stats$optim_bounds[1], ser_stats$optim_bounds[2]), extendInt = "yes", tol = .Machine$double.eps^0.25)$root, error = function(e) { # Fallback: if uniroot fails (no sign change), use initial value if (ser_stats$optim_scale == "linear") V else log(V) } ) V_new <- if (ser_stats$optim_scale == "linear") V_root else exp(V_root) # Check if new estimate improves likelihood V_param_init <- if (ser_stats$optim_scale == "linear") V else log(V) if 
(neg_loglik(data, params, model, V_root, ser_stats) > neg_loglik(data, params, model, V_param_init, ser_stats)) { V_new <- V } V <- V_new } else if (params$estimate_prior_method == "EM") { V <- em_update_prior_variance(data, params, model, alpha, moments, V_init) } else { stop("Invalid option for estimate_prior_method: ", params$estimate_prior_method) } } # Set V exactly 0 if that beats the numerical value by # check_null_threshold in loglik. check_null_threshold = 0.1 is # exp(0.1) = 1.1 on likelihood scale; it means that for parsimony # reasons we set estimate of V to zero, if its numerical estimate is # only "negligibly" different from zero. We use a likelihood ratio # of exp(check_null_threshold) to define "negligible" in this # context. This is fairly modest condition compared to, say, a # formal LRT with p-value 0.05. But the idea is to be lenient to # non-zeros estimates unless they are indeed small enough to be # neglible. See more intuition at # https://stephens999.github.io/fiveMinuteStats/LR_and_BF.html # # For EM, skip this check: the null check would zero V without # recomputing the posterior, creating an inconsistent (q, V) pair # that can decrease the ELBO. Null effects are handled by # trim_null_effects() after convergence instead. # see https://github.com/stephenslab/mvsusieR/issues/26 if (params$estimate_prior_method != "EM" && params$estimate_prior_method != "none") { if (loglik(data, params, model, 0, ser_stats) + params$check_null_threshold >= loglik(data, params, model, V, ser_stats)) { V <- 0 } } list(V = V, model = model) } # ============================================================================= # SINGLE EFFECT UPDATE # # High-level function that updates one effect in the SuSiE model. # Coordinates residual computation, SER, KL divergence, and fitted value updates. 
# =============================================================================

#' Update one single effect of the SuSiE model
#'
#' Runs the three steps of one IBSS inner update for effect `l`:
#' residual computation, the single effect regression itself, and the
#' fitted-value refresh. Each step dispatches on the data class.
#'
#' @param data Data object (individual, ss, or rss_lambda)
#' @param params Validated params object
#' @param model Current SuSiE model object
#' @param l Effect index being updated
#'
#' @return Updated SuSiE model object with new parameters for effect l
#'
#' @keywords internal
#' @noRd
single_effect_update <- function(data, params, model, l) {
  # Compute Residuals
  model <- compute_residuals(data, params, model, l)
  # Run Single Effect Regression
  model <- single_effect_regression(data, params, model, l)
  # Update fitted values
  model <- update_fitted_values(data, params, model, l)
  return(model)
}



================================================
FILE: R/slot_prior.R
================================================
#' @title Slot Activity Prior for SuSiE
#'
#' @description Construct a prior specification for the slot activity
#'   model, which regularizes the number of active single effects in
#'   SuSiE. Two prior families are available: Beta-Binomial (default,
#'   recommended for single-locus) and Gamma-Poisson (recommended for
#'   genome-wide applications via susieAnn).
#'
#' @param C Expected number of causal variants for the Gamma-Poisson prior
#'   on the per-block causal rate. Must be positive. Not used by
#'   \code{slot_prior_betabinom}.
#' @param nu Overdispersion parameter for the Gamma-Poisson prior on the
#'   per-block causal rate. Not used by \code{slot_prior_betabinom}.
#'   Larger values give stronger shrinkage toward C. Default 8 when
#'   not specified.
#' @param a_beta Shape parameter for the Beta prior on inclusion
#'   probability rho. Default 1.
#' @param b_beta Shape parameter for the Beta prior on inclusion
#'   probability rho. Default 2, giving a moderate sparsity preference
#'   with \code{E[rho] = 1/3 ~ 0.33}. Setting \code{a_beta = 1}
#'   and \code{b_beta = 1} gives a uniform prior on [0,1], providing
#'   automatic multiplicity correction following Scott and Berger (2010).
#' @param update_schedule How the Gamma shape parameter is updated
#'   during IBSS iterations (Gamma-Poisson only; ignored for
#'   Beta-Binomial which is inherently sequential).
#'   \code{"batch"} updates once per full sweep (standard CAVI).
#'   \code{"sequential"} updates after each slot (faster convergence
#'   per iteration, used by susieAnn).
#' @param c_hat_init Optional numeric L-vector of initial slot activity
#'   probabilities for warm-starting. If NULL, initialized at the
#'   prior mean.
#' @param skip_threshold_multiplier Multiplier for the adaptive skip
#'   threshold. Slots with c_hat below this fraction of the baseline
#'   (prior with zero signal) are skipped. Default 0 (no skipping).
#'   The threshold is recomputed after each sweep from the current
#'   model state, and is set to 0 on the first sweep so all slots
#'   are evaluated at least once.
#'
#' @return A list of class \code{"slot_prior"} with the appropriate
#'   subclass.
#'
#' @details
#' Two prior types are available:
#' \describe{
#'   \item{\code{slot_prior_betabinom}}{Uses a Beta-Binomial model
#'     for slot inclusion. The inclusion probability rho is given a
#'     Beta(a_beta, b_beta) prior and integrated out analytically,
#'     yielding an adaptive multiplicity correction that penalizes
#'     less when more slots are active. This is the recommended
#'     default for single-locus applications. See Scott and Berger
#'     (2010) for the theoretical justification.}
#'   \item{\code{slot_prior_poisson}}{Uses the Gamma-Poisson model
#'     with Poisson approximation for slot indicators. Recommended
#'     for genome-wide applications via susieAnn, where C and nu
#'     are estimated across loci.}
#' }
#'
#' @references
#' Scott, J. G. and Berger, J. O. (2010). Bayes and empirical-Bayes
#' multiplicity adjustment in the variable-selection problem.
#' \emph{Annals of Statistics}, 38(5), 2587--2619.
#'
#' @examples
#' # Default: Beta-Binomial with Beta(1, 2) prior on inclusion probability
#' slot_prior_betabinom()
#'
#' # Gamma-Poisson for susieAnn
#' slot_prior_poisson(C = 5, nu = 8)
#'
#' # Pass to susie
#' # fit <- susie(X, y, slot_prior = slot_prior_betabinom())

# Beta-Binomial: rho ~ Beta(a, b), c_l | rho ~ Bern(rho), rho collapsed.
# Collapsed update: logit(c_l) = log(a + k_{-l}) - log(b + L-1 - k_{-l}) + lbf_l
# Scott & Berger (2010), Ann. Statist. 38(5):2587-2619.
#' @export
slot_prior_betabinom <- function(a_beta = NULL, b_beta = NULL,
                                 c_hat_init = NULL,
                                 skip_threshold_multiplier = 0) {
  # Record whether the user accepted both defaults; downstream code can
  # use this flag (e.g., to allow automatic re-tuning of the defaults).
  ab_was_default <- is.null(a_beta) && is.null(b_beta)
  if (is.null(a_beta)) a_beta <- 1
  # Beta(1, 2) gives approximately linear decline in the number of active
  # slots: P(K=1) > P(K=2) > P(K=3) > ..., favoring sparse architectures
  # while still allowing multiple effects. E[rho] = 1/3, expecting ~3 of 10.
  if (is.null(b_beta)) b_beta <- 2
  stopifnot(is.numeric(a_beta), length(a_beta) == 1, a_beta > 0)
  stopifnot(is.numeric(b_beta), length(b_beta) == 1, b_beta > 0)
  structure(
    list(
      a_beta = a_beta,
      b_beta = b_beta,
      ab_was_default = ab_was_default,
      update_schedule = "sequential", # inherently sequential (uses k_{-l})
      c_hat_init = c_hat_init,
      skip_threshold_multiplier = skip_threshold_multiplier
    ),
    class = c("slot_prior_betabinom", "slot_prior")
  )
}

#' @rdname slot_prior_betabinom
#' @export
slot_prior_poisson <- function(C, nu = NULL,
                               update_schedule = c("sequential", "batch"),
                               c_hat_init = NULL,
                               skip_threshold_multiplier = 0) {
  update_schedule <- match.arg(update_schedule)
  stopifnot(is.numeric(C), length(C) == 1, C > 0)
  # Record whether nu came from the default so callers can distinguish
  # a user-supplied nu = 8 from the implicit default.
  nu_was_null <- is.null(nu)
  if (nu_was_null) nu <- 8
  stopifnot(is.numeric(nu), length(nu) == 1, nu > 0)
  structure(
    list(
      C = C,
      nu = nu,
      nu_was_default = nu_was_null,
      update_schedule = update_schedule,
      c_hat_init = c_hat_init,
      skip_threshold_multiplier = skip_threshold_multiplier
    ),
    class = c("slot_prior_poisson", "slot_prior")
  )
}

#' @export
print.slot_prior <- function(x, ...) { type <- if (inherits(x, "slot_prior_betabinom")) "beta-binomial" else "poisson" cat(sprintf("Slot activity prior (%s)\n", type)) if (type == "beta-binomial") { cat(sprintf(" a_beta: %g\n", x$a_beta)) cat(sprintf(" b_beta: %g\n", x$b_beta)) } else { cat(sprintf(" C (expected causal): %g\n", x$C)) cat(sprintf(" nu (overdispersion): %g\n", x$nu)) } if (type != "beta-binomial") cat(sprintf(" update schedule: %s\n", x$update_schedule)) if (!is.null(x$c_hat_init)) cat(sprintf(" warm start: %d-vector\n", length(x$c_hat_init))) invisible(x) } #' Check if an object is a slot_prior #' @param x Object to test. #' @return Logical. #' @keywords internal #' @noRd is.slot_prior <- function(x) inherits(x, "slot_prior") #' ELBO contribution from the slot activity prior. #' Beta-Binomial: log Beta(a+k, b+L-k) - log Beta(a,b) + Bernoulli entropy. #' Gamma-Poisson: Gamma prior/entropy + Poisson slot prior + Bernoulli entropy. #' @keywords internal #' @noRd slot_prior_elbo <- function(model) { st <- model$c_hat_state chat <- model$slot_weights L <- length(chat) # Bernoulli entropy: -sum(c log c + (1-c) log(1-c)) eps <- .Machine$double.eps ch <- pmax(pmin(chat, 1 - eps), eps) bern_entropy <- -sum(ch * log(ch) + (1 - ch) * log(1 - ch)) if (st$prior_type == "betabinom") { k <- sum(chat) log_prior <- lbeta(st$a_beta + k, st$b_beta + L - k) - lbeta(st$a_beta, st$b_beta) return(log_prior + bern_entropy) } # Gamma-Poisson: E_q[log mu] = psi(a_g) - log(b_g), E_q[mu] = a_g/b_g a_g <- st$a_g; b_g <- st$b_g; nu <- st$nu; C <- st$C Eq_log_mu <- digamma(a_g) - log(b_g) Eq_mu <- a_g / b_g Lhat <- sum(chat) # E[log p(mu)] + H[q(mu)] + E[log p(c|mu)] gamma_prior <- (nu - 1) * Eq_log_mu - (nu / max(C, 1e-10)) * Eq_mu + nu * log(nu / max(C, 1e-10)) - lgamma(nu) gamma_entropy <- a_g - log(b_g) + lgamma(a_g) + (1 - a_g) * digamma(a_g) slot_prior <- Lhat * (Eq_log_mu - log(L)) return(gamma_prior + gamma_entropy + slot_prior + bern_entropy) } 
================================================
FILE: R/sparse_multiplication.R
================================================
# @title Computes standardized.X %*% b using sparse multiplication trick
# @param X an n by p unstandardized matrix with three attributes:
#   attr(X,"scaled:center"), attr(X,"scaled:scale") and attr(X,"d")
# @param b a p vector
# @return an n vector
#
#' @importFrom Matrix t
#' @importFrom Matrix tcrossprod
compute_Xb <- function(X, b) {
  cm <- attr(X, "scaled:center")
  csd <- attr(X, "scaled:scale")
  # Scale Xb.
  if (!is.null(attr(X, "matrix.type"))) {
    # When X is a trend filtering matrix.
    scaled.Xb <- compute_tf_Xb(attr(X, "order"), b / csd)
  } else {
    # When X is an ordinary sparse/dense matrix.
    # tcrossprod(X, t(b/csd)) == X %*% (b/csd), written to keep X sparse.
    scaled.Xb <- tcrossprod(X, t(b / csd))
  }
  # Center Xb: subtracting sum(cm*b/csd) equals multiplying by centered X.
  Xb <- scaled.Xb - sum(cm * b / csd)
  return(as.numeric(Xb))
}

# @title Computes t(standardized.X) %*% y using sparse multiplication trick
# @param X an n by p unstandardized matrix with three attributes:
#   attr(X,"scaled:center"), attr(X,"scaled:scale") and attr(X,"d")
# @param y an n vector
# @return a p vector
#
#' @importFrom Matrix t
#' @importFrom Matrix crossprod
compute_Xty <- function(X, y) {
  cm <- attr(X, "scaled:center")
  csd <- attr(X, "scaled:scale")
  ytX <- crossprod(y, X)
  # Scale Xty.
  if (!is.null(attr(X, "matrix.type"))) {
    # When X is a trend filtering matrix.
    scaled.Xty <- compute_tf_Xty(attr(X, "order"), y) / csd
  } else {
    # When X is an ordinary sparse/dense matrix.
    scaled.Xty <- t(ytX / csd)
  }
  # Center Xty.
  centered.scaled.Xty <- scaled.Xty - cm / csd * sum(y)
  return(as.numeric(centered.scaled.Xty))
}

# @title Computes t(standardized.X) %*% standardized.X using attributes
# @param X an n by p unstandardized matrix with three attributes:
#   attr(X,"scaled:center"), attr(X,"scaled:scale") and attr(X,"d")
# @return a p by p matrix representing (scaled X)'(scaled X)
#
#' @importFrom Matrix crossprod
compute_XtX <- function(X) {
  cm <- attr(X, "scaled:center")
  csd <- attr(X, "scaled:scale")
  n <- nrow(X)
  colsums_X <- colSums(X)
  if (!is.null(attr(X, "matrix.type"))) {
    stop("compute_XtX not yet implemented for trend filtering matrices")
  }
  # Compute raw X'X
  XtX_raw <- crossprod(X)
  # Scale columns and rows by 1/csd
  XtX_scaled <- sweep(sweep(XtX_raw, 1, csd, "/"), 2, csd, "/")
  # Adjust for centering. The three correction terms expand to the exact
  # identity D^-1 (X'X - cm s' - s cm' + n cm cm') D^-1 with s = colSums(X):
  # -n A - (B - nA) - (B' - nA) = nA - B - B', A = cm cm', B = cm s'.
  XtX_centered_scaled <- XtX_scaled -
    n * outer(cm/csd, cm/csd) -
    outer(cm/csd, (colsums_X - n*cm)/csd) -
    outer((colsums_X - n*cm)/csd, cm/csd)
  return(XtX_centered_scaled)
}

# @title Computes M %*% t(standardized.X) using sparse multiplication trick
# @param M a L by p matrix
# @param X an n by p unstandardized matrix with three attributes:
#   attr(X,"scaled:center"), attr(X,"scaled:scale") and attr(X,"d")
# @return a L by n matrix
#
#' @importFrom Matrix t
compute_MXt <- function(M, X) {
  cm <- attr(X, "scaled:center")
  csd <- attr(X, "scaled:scale")
  if (!is.null(attr(X, "matrix.type"))) {
    # When X is a trend filtering matrix.
    return(as.matrix(t(apply(M, 1, function(b) compute_Xb(X, b)))))
  } else {
    # When X is an ordinary sparse/dense matrix.
    return(as.matrix(t(X %*% (t(M) / csd)) - drop(M %*% (cm / csd))))
  }
  # This should be the same as
  #
  #   t(apply(M, 1, function(b) compute_Xb(X, b))))
  #
  # as well as
  #
  #   M %*% (t(X)/csd) - drop(tcrossprod(M,t(cm/csd)))
  #
  # but should be more memory-efficient.
}



================================================
FILE: R/ss_mixture_methods.R
================================================
# =============================================================================
# SS MIXTURE PANEL METHODS
#
# Class c("ss_mixture", "ss"). Inherits ALL SER/ELBO from ss path.
# Overrides: 5 methods for omega-aware state management.
#
# Model: y ~ N(X(omega)*beta, sigma2*I), X'X = (n-1)*R(omega)
# mu on betahat scale (same as ss). Omega evaluators use z-score scale.
# =============================================================================

# (n-1)*R(omega)*v using current X_meta (or fallback to data$X)
#' @keywords internal
compute_XtXv_mixture <- function(data, model, v) {
  # Use panel_R for accurate R*v (cov2cor-based, not standardize_X):
  # mix the per-panel R %*% v products with the current omega weights.
  if (!is.null(model$omega) && !is.null(data$panel_R)) {
    Rv <- Reduce("+", Map(function(w, R) w * (R %*% v), model$omega, data$panel_R))
    return(data$nm1 * as.vector(Rv))
  }
  # Fallback: data$X = sqrt(n-1)*X_meta_init
  as.vector(compute_Rv(data, v))
}

# 1. Initialize fitted values
#' @keywords internal
initialize_fitted.ss_mixture <- function(data, mat_init) {
  # XtXr holds X'X times the current overall effect vector.
  list(XtXr = as.vector(compute_Rv(data, colSums(mat_init$alpha * mat_init$mu))))
}

# 2. Compute residuals using current R(omega)
#' @keywords internal
compute_residuals.ss_mixture <- function(data, params, model, l, ...) {
  # Remove effect l (scaled by its slot weight) from the fitted values.
  sw_l <- get_slot_weight(model, l)
  bl <- model$alpha[l, ] * model$mu[l, ]
  XtXr_without_l <- model$XtXr - sw_l * compute_XtXv_mixture(data, model, bl)
  model$residuals <- data$Xty - XtXr_without_l
  model$fitted_without_l <- XtXr_without_l
  model$residual_variance <- model$sigma2
  model$predictor_weights <- rep(data$nm1, data$p)
  if (!is.null(data$R_finite_B) && model$sigma2 > .Machine$double.eps) {
    # Region-level scalar lambda_bias is set by fit_R_mismatch once per
    # IBSS sweep; here we just apply it through the slot-specific
    # xi_l = eta_l^2 + v_g,l on z-scale.
    sw <- if (!is.null(model$slot_weights)) model$slot_weights else rep(1, nrow(model$alpha))
    b_minus_l <- colSums(sw * model$alpha * model$mu) - sw_l * bl
    nm1 <- data$nm1
    v_g <- max(sum(b_minus_l * XtXr_without_l), 0)
    xi_l <- XtXr_without_l^2 / nm1 + v_g
    lambda_bias <- if (is.null(model$lambda_bias)) 0 else model$lambda_bias
    R_finite_B <- if (!is.null(model$R_finite_B)) model$R_finite_B else data$R_finite_B
    model$shat2_inflation <- 1 + (1 / R_finite_B + lambda_bias) * xi_l / model$sigma2
  }
  return(model)
}

# 3. Update fitted values + precompute z-score quantities for omega
#' @keywords internal
update_fitted_values.ss_mixture <- function(data, params, model, l, ...) {
  sw_l <- get_slot_weight(model, l)
  bl <- model$alpha[l, ] * model$mu[l, ]
  model$XtXr <- model$fitted_without_l + sw_l * compute_XtXv_mixture(data, model, bl)
  # Convert betahat-scale mu to z-score scale for omega evaluators.
  # Weight by slot_weights (c_hat) when active.
  sqnm1 <- sqrt(data$nm1)
  sw <- if (!is.null(model$slot_weights)) model$slot_weights else rep(1, nrow(model$alpha))
  model$Z <- sw * model$alpha * model$mu * sqnm1
  model$zbar <- colSums(model$Z)
  model$diag_postb2 <- colSums(sw * model$alpha * model$mu2 * data$nm1)
  return(model)
}

# 4. Update variance: sigma2 (via default ss chain) + omega M-step
#' @keywords internal
update_model_variance.ss_mixture <- function(data, params, model) {
  # Sigma2: reuse default chain (est_residual_variance + bounds)
  if (isTRUE(params$estimate_residual_variance)) {
    model <- update_model_variance.default(data, params, model)
  }
  # Omega M-step: only while the omega weights have not yet converged.
  if (!is.null(data$K) && data$K > 1 && !isTRUE(model$omega_converged)) {
    omega_cur <- if (!is.null(model$omega)) model$omega else rep(1 / data$K, data$K)
    # Omega-objective ridge: small floor used ONLY inside the Eloglik
    # evaluator to stabilize log|sigma2*A(omega)| near rank-deficient
    # vertices. Without it, small eigenvalues of A(omega) produce a huge
    # -0.5 * log|.| penalty at vertex omegas, pulling the optimizer toward
    # the interior (collapse to ~uniform weights). Matches the behavior
    # of the prev rss_lambda path with auto lambda = 1/(n-1). Does NOT
    # affect the ss-SER update, which still uses lambda = 0 (no FDR
    # inflation in the credible-set inference).
    omega_ridge <- 1 / data$nm1
    eval_omega <- NULL
    if (!is.null(data$omega_cache)) {
      # Precomputed cache path: fold the per-iteration model state in once.
      cache <- data$omega_cache
      iter_cache <- precompute_omega_iteration(cache, model$zbar, model$diag_postb2, model$Z)
      eval_omega <- function(w) {
        eval_omega_eloglik_reduced(cache, w, iter_cache, model$sigma2,
                                   omega_ridge, data$K, data$p)
      }
    } else if (!is.null(data$panel_R)) {
      # Direct path: evaluate from the per-panel LD matrices.
      eval_omega <- function(w) {
        eval_omega_eloglik_R(data$panel_R, w, data$z, model$zbar,
                             model$diag_postb2, model$Z, model$sigma2,
                             omega_ridge, data$K, data$p)
      }
    }
    if (!is.null(eval_omega)) {
      opt <- optimize_omega(eval_omega, omega_cur, data$K)
      model$omega <- opt$omega
      if (!is.null(data$R_finite_B) && !is.null(data$B_list))
        model$R_finite_B <- 1 / sum(model$omega^2 / data$B_list)
      # Recompute XtXr with updated R(omega)
      b_bar <- colSums(model$alpha * model$mu)
      model$XtXr <- compute_XtXv_mixture(data, model, b_bar)
      if (opt$converged) model$omega_converged <- TRUE
    }
  }
  return(model)
}

# 5.
ER2 using current R(omega), not stale data$X #' @keywords internal get_ER2.ss_mixture <- function(data, model) { B <- model$alpha * model$mu betabar <- colSums(B) postb2 <- model$alpha * model$mu2 XtX_betabar <- compute_XtXv_mixture(data, model, betabar) XB2 <- 0 for (l in seq_len(nrow(B))) { bl <- B[l, ] XB2 <- XB2 + sum(bl * compute_XtXv_mixture(data, model, bl)) } data$yty - 2 * sum(betabar * data$Xty) + sum(betabar * XtX_betabar) - XB2 + data$nm1 * sum(postb2) } ================================================ FILE: R/sufficient_stats_methods.R ================================================ # ============================================================================= # DATA INITIALIZATION & CONFIGURATION # # Functions for data object setup, configuration, and preprocessing. # These prepare data objects for model fitting and handle data-specific # configurations like unmappable effects. # # Functions: configure_data, get_var_y # ============================================================================= # Configure ss data for specified method #' @keywords internal configure_data.ss <- function(data, params) { if (params$unmappable_effects == "inf") { return(add_eigen_decomposition(data, params)) } else { return(configure_data.default(data, params)) } } # Get variance of y #' @keywords internal get_var_y.ss <- function(data, ...) { return(data$yty / (data$n - 1)) } # ============================================================================= # MODEL INITIALIZATION & SETUP # # Functions for initializing model objects and setting up initial states. # These create model matrices, initialize fitted values, and prepare # the SuSiE model for iterative fitting. # # Functions: initialize_susie_model, initialize_fitted, validate_prior, track_ibss_fit # ============================================================================= # Initialize SuSiE model #' @keywords internal initialize_susie_model.ss <- function(data, params, var_y, ...) 
{ # Base model model <- initialize_matrices(data, params, var_y) # Append predictor weights and initialize non-sparse quantities if (params$unmappable_effects == "inf") { # Initialize omega quantities for unmappable effects omega_res <- compute_omega_quantities(data, tau2 = 0, sigma2 = var_y) model$omega_var <- omega_res$omega_var model$predictor_weights <- omega_res$diagXtOmegaX model$XtOmegay <- data$eigen_vectors %*% (data$VtXty / omega_res$omega_var) # Initialize unmappable variance component and coefficients model$tau2 <- 0 model$theta <- rep(0, data$p) } else if (params$unmappable_effects == "ash") { pm <- if (!is.null(data$XtX)) data$XtX else data$X model$predictor_weights <- attr(pm, "d") model <- init_ash_fields(model, data$n, data$p, params$L, is_individual = FALSE) } else if (params$unmappable_effects == "ash_filter_archived") { pm <- if (!is.null(data$XtX)) data$XtX else data$X model$predictor_weights <- attr(pm, "d") model <- init_ash_fields_filter_archived(model, data$n, data$p, params$L, is_individual = FALSE) } else { pm <- if (!is.null(data$XtX)) data$XtX else data$X model$predictor_weights <- attr(pm, "d") # Initialize NIG parameters if (params$use_NIG) { model$rv <- rep(1, params$L) model$marginal_loglik <- rep(as.numeric(NA), params$L) } } return(model) } # Initialize fitted values #' @keywords internal initialize_fitted.ss <- function(data, mat_init) { return(list(XtXr = compute_Rv(data, colSums(mat_init$alpha * mat_init$mu)))) } # Validate Prior Variance #' @keywords internal validate_prior.ss <- function(data, params, model, ...) { if (isTRUE(params$check_prior)) { if (is.null(data$zm)) { bhat <- data$Xty / model$predictor_weights shat <- sqrt(model$sigma2 / model$predictor_weights) z <- bhat / shat data$zm <- max(abs(z[!is.nan(z)])) } if (any(model$V > 100 * (data$zm^2))) { stop( "Estimated prior variance is unreasonably large.\n", "This usually caused by mismatch between the summary statistics and the R matrix.\n", "Please check the input." 
) } } return(validate_prior.default(data, params, model, ...)) } # Track core parameters across iterations #' @keywords internal track_ibss_fit.ss <- function(data, params, model, tracking, iter, elbo, ...) { if (params$unmappable_effects %in% c("inf", "ash", "ash_filter_archived")) { # Append non-sparse variance component to tracking tracking <- track_ibss_fit.default(data, params, model, tracking, iter, elbo, ...) if (isTRUE(params$track_fit)) { tracking[[iter]]$tau2 <- model$tau2 } return(tracking) } else { # Use default for standard SS case return(track_ibss_fit.default(data, params, model, tracking, iter, elbo, ...)) } } # ============================================================================= # SINGLE EFFECT REGRESSION & ELBO # # Core functions for single effect regression computation and ELBO calculation. # These handle the mathematical core of SuSiE including residual computation, SER # statistics, posterior moments, and log-likelihood calculations for the ELBO. # # Functions: compute_residuals, compute_ser_statistics, SER_posterior_e_loglik, # calculate_posterior_moments, compute_kl, get_ER2, Eloglik, loglik, neg_loglik # ============================================================================= # Compute residuals for single effect regression #' @keywords internal compute_residuals.ss <- function(data, params, model, l, ...) 
{ # Weighted sum of effects excluding l (slot_weights scale each effect's contribution) sw_l <- get_slot_weight(model, l) sw <- if (!is.null(model$slot_weights)) model$slot_weights else rep(1, nrow(model$alpha)) b_minus_l <- colSums(sw * model$alpha * model$mu) - sw_l * model$alpha[l, ] * model$mu[l, ] if (params$unmappable_effects == "inf") { # SuSiE-inf: Omega-weighted residuals omega_res <- compute_omega_quantities(data, model$tau2, model$sigma2) XtOmegay <- data$eigen_vectors %*% (data$VtXty / omega_res$omega_var) XtOmegaXb <- data$eigen_vectors %*% ((t(data$eigen_vectors) %*% b_minus_l) * data$eigen_values / omega_res$omega_var) model$residuals <- XtOmegay - XtOmegaXb model$predictor_weights <- omega_res$diagXtOmegaX model$residual_variance <- 1 # Already incorporated in Omega # R inflation uses standard (non-Omega) quantities XtXr_without_l <- compute_Rv(data, b_minus_l) r <- data$Xty - XtXr_without_l infl_state <- compute_shat2_inflation(data, model, XtXr_without_l, b_minus_l, r) model <- apply_inflation_state(model, infl_state, l) return(model) } # Below are SuSiE, SuSiE-ASH and SuSiE-SS # Remove lth effect from fitted values (scaled by slot weight) XtXr_without_l <- model$XtXr - sw_l * compute_Rv(data, model$alpha[l, ] * model$mu[l, ]) # Compute residuals (ash subtracts unmappable effect X'X*theta). 
is_ash <- params$unmappable_effects %in% c("ash", "ash_filter_archived") if (is_ash) { model$residuals <- data$Xty - model$XtX_theta - XtXr_without_l } else { model$residuals <- data$Xty - XtXr_without_l } model$fitted_without_l <- XtXr_without_l model$residual_variance <- model$sigma2 # NIG prior: compute residual sum of squares if (params$use_NIG) { model$yy_residual <- as.numeric( data$yty - 2 * sum(b_minus_l * data$Xty) + sum(b_minus_l * XtXr_without_l)) model$yy_residual <- max(model$yy_residual, .Machine$double.eps) } # ASH path: residual subtracts theta (line 167), so the variance scale # s = eta^2 + v_g must also be built from b_minus_l + theta or the # data and variance model disagree on what has been removed. if (is_ash && !is.null(model$theta)) { XtX_theta <- if (!is.null(model$XtX_theta)) model$XtX_theta else compute_Rv(data, model$theta) b_for_infl <- b_minus_l + model$theta XtXr_for_infl <- XtXr_without_l + XtX_theta } else { b_for_infl <- b_minus_l XtXr_for_infl <- XtXr_without_l } infl_state <- compute_shat2_inflation(data, model, XtXr_for_infl, b_for_infl, model$residuals) model <- apply_inflation_state(model, infl_state, l) return(model) } # compute_shat2_inflation moved to R/rss_mismatch.R. # Compute SER statistics #' @keywords internal compute_ser_statistics.ss <- function(data, params, model, l, ...) 
{ betahat <- (1 / model$predictor_weights) * model$residuals shat2 <- model$residual_variance / model$predictor_weights # Inflate shat2 for finite-reference R variance tracking (tau_j^2 / sigma^2) if (!is.null(model$shat2_inflation)) shat2 <- shat2 * model$shat2_inflation # Optimization parameters if (params$unmappable_effects == "inf") { # SuSiE-inf: optimize on linear scale optim_init <- model$V[l] optim_bounds <- c(0, 1) optim_scale <- "linear" } else { # Standard SuSiE and SuSiE-ash: optimize on log scale optim_init <- log(max(c(betahat^2 - shat2, 1), na.rm = TRUE)) optim_bounds <- c(-30, 15) optim_scale <- "log" } return(list( betahat = betahat, shat2 = shat2, optim_init = optim_init, optim_bounds = optim_bounds, optim_scale = optim_scale )) } # Posterior expected log-likelihood for a single effect regression #' @keywords internal SER_posterior_e_loglik.ss <- function(data, params, model, l) { Eb <- model$alpha[l, ] * model$mu[l, ] Eb2 <- model$alpha[l, ] * model$mu2[l, ] if (params$unmappable_effects == "inf") { # SuSiE-inf: Omega-weighted likelihood return(-0.5 * (-2 * sum(Eb * model$residuals) + sum(model$predictor_weights * as.vector(Eb2)))) } else { # Standard SuSiE and SuSiE-ash return(-0.5 / model$residual_variance * (-2 * sum(Eb * model$residuals) + sum(model$predictor_weights * as.vector(Eb2)))) } } # Calculate posterior moments for single effect regression #' @keywords internal calculate_posterior_moments.ss <- function(data, params, model, V, l, ...) 
{ if (params$use_NIG) { # NIG posterior moments if (V <= 0) { post_mean <- rep(0, data$p) post_mean2 <- rep(0, data$p) model$rv[l] <- 1 } else { nig_ss <- get_nig_sufficient_stats(data, model) moments <- compute_posterior_moments_NIG(data$n, model$predictor_weights, model$residuals, nig_ss$yy, nig_ss$sxy, V, params$alpha0, params$beta0, nig_ss$tau) post_mean <- moments$post_mean post_mean2 <- moments$post_mean2 model$rv[l] <- sum(model$alpha[l, ] * moments$rv) } } else { # Standard Gaussian posterior calculations shat2 <- model$residual_variance / model$predictor_weights if (!is.null(model$shat2_inflation)) shat2 <- shat2 * model$shat2_inflation post_var <- V * shat2 / (V + shat2) post_mean <- V * (model$residuals / model$predictor_weights) / (V + shat2) post_mean2 <- post_var + post_mean^2 } # Store posterior moments in model model$mu[l, ] <- post_mean model$mu2[l, ] <- post_mean2 return(model) } # Calculate KL divergence #' @keywords internal compute_kl.ss <- function(data, params, model, l) { if (params$use_NIG) { # NIG KL only valid for L=1 (gIBSS for L>1 has no coherent ELBO; supp. line 503) if (params$L == 1) { ki <- nig_kl_inputs(data, params, model, l) model$KL[l] <- compute_kl_NIG(model$alpha[l, ], model$mu[l, ], model$mu2[l, ], model$pi, model$V[l], a0 = params$alpha0 / 2, b0 = params$beta0 / 2, a_post = ki$a_post, b_post = ki$b_post, s_j_sq = ki$s_j_sq) } else { model$KL[l] <- 0 } } else { model <- compute_kl.default(data, params, model, l) } return(model) } # Expected Squared Residuals #' @keywords internal get_ER2.ss <- function(data, model) { B <- model$alpha * model$mu postb2 <- model$alpha * model$mu2 # Posterior second moment. # Slot-weight correction: E[||y - sum_l c_l X beta^(l)||^2] under Bern(chat_l) # = y'y - 2 betabar_w' X'y + betabar_w' X'X betabar_w # + sum_l chat_l * E[b^(l)' X'X b^(l)] - chat_l^2 * bbar_l' X'X bbar_l # When slot_weights is NULL (all weights = 1), reduces to the standard formula. 
sw <- if (!is.null(model$slot_weights)) model$slot_weights else rep(1, nrow(B)) betabar <- colSums(sw * B) # c_hat-weighted mean per_slot_XB2 <- rowSums(compute_BR(data, B) * B) # bbar_l' R bbar_l per_slot_Eb2 <- as.vector(postb2 %*% model$predictor_weights) # diag(X'X)' (alpha*mu2)_l return(data$yty - 2 * sum(betabar * data$Xty) + sum(betabar * compute_Rv(data, betabar)) - sum(sw^2 * per_slot_XB2) + sum(sw * per_slot_Eb2)) } # Expected log-likelihood for the sufficient-stats path. Without inflation, # the standard regression log-likelihood under sigma2 (matches Eloglik.individual). # With finite-R inflation, the SER posterior fits a betahat-scale augmented # model; switch to the matching data-fit term. Affects ELBO only; PIP/CS/ # sigma2 (which goes through est_residual_variance, not Eloglik) are unchanged. #' @keywords internal Eloglik.ss <- function(data, model) { if (!is.null(model$shat2_inflation)) return(compute_augmented_eloglik_ss(data, model)) -data$n / 2 * log(2 * pi * model$sigma2) - 1 / (2 * model$sigma2) * get_ER2(data, model) } # Variational expectation of the augmented betahat-scale Gaussian log- # likelihood under finite-R inflation. Form derived in # ld_mismatch_generativemodel.tex Sec. "Variational ELBO under the # augmented variance". The Var_q[(X'X beta)_j] correction requires # (X'X)^2 element-wise; formed on each call. 
#' @keywords internal
compute_augmented_eloglik_ss <- function(data, model)
{
  pw <- data$predictor_weights      # diag(X'X) per variable.
  infl <- model$shat2_inflation     # Finite-reference inflation factor(s).
  sigma2 <- model$sigma2
  p <- length(pw)
  # Slot activity weights; default to 1 (all slots fully active).
  sw <- if (!is.null(model$slot_weights)) model$slot_weights
        else rep(1, nrow(model$alpha))
  am <- model$alpha * model$mu      # Posterior means per slot (L x p).
  am2 <- model$alpha * model$mu2    # Posterior second moments per slot.
  betabar <- colSums(sw * am)       # Weighted overall posterior mean.
  # Mean of the betahat-scale residual: X'y - X'X betabar.
  res_mean <- data$Xty - compute_Rv(data, betabar)
  # X'X is materialized here if only X is stored (low-rank path).
  XtX <- if (!is.null(data$XtX)) data$XtX else crossprod(data$X)
  XtX_sq <- XtX * XtX               # Element-wise square, for Var_q[(X'X b)_j].
  F_mat <- am %*% XtX
  G_mat <- am2 %*% XtX_sq
  # Per-variable variance correction, summed over slots with weights sw^2.
  var_corr <- as.vector(crossprod(G_mat - F_mat^2, sw^2))
  # Gaussian log-density of the augmented model with per-variable
  # variance sigma2 * infl / pw.
  -p / 2 * log(2 * pi) - 0.5 * sum(log(sigma2 * infl / pw)) -
    0.5 * sum((res_mean^2 + var_corr) / (pw * sigma2 * infl))
}

# Single-effect-regression log Bayes factors and posterior weights for the
# sufficient-stats path. When `l` is supplied the results are stored in the
# model; otherwise the model-level lbf is returned (used when optimizing V).
#' @importFrom Matrix colSums
#' @importFrom stats dnorm
#' @keywords internal
loglik.ss <- function(data, params, model, V, ser_stats, l = NULL, ...)
{
  if (params$use_NIG) {
    # NIG log Bayes factors
    nig_ss <- get_nig_sufficient_stats(data, model)
    lbf <- compute_lbf_NIG(data$n, model$predictor_weights, model$residuals,
                           nig_ss$yy, nig_ss$sxy, V, params$alpha0,
                           params$beta0, nig_ss$tau)
  } else {
    # Standard Gaussian prior log Bayes factors:
    # log N(betahat; 0, V + shat2) - log N(betahat; 0, shat2).
    lbf <- dnorm(ser_stats$betahat, 0, sqrt(V + ser_stats$shat2), log = TRUE) -
      dnorm(ser_stats$betahat, 0, sqrt(ser_stats$shat2), log = TRUE)
  }
  # Stabilize logged Bayes Factor (guards against Inf/NaN from tiny shat2).
  stable_res <- lbf_stabilization(lbf, model$pi, ser_stats$shat2)
  # Compute posterior inclusion weights from log posterior odds.
  weights_res <- compute_posterior_weights(stable_res$lpo)
  # Store in model if l is provided, otherwise return lbf_model for prior
  # variance optimization.
  if (!is.null(l)) {
    model$alpha[l, ] <- weights_res$alpha
    model$lbf[l] <- weights_res$lbf_model
    model$lbf_variable[l, ] <- stable_res$lbf
    # Compute and store marginal log-likelihood for NIG prior
    # (nig_ss exists here because use_NIG took the branch above).
    if (params$use_NIG) {
      model$marginal_loglik[l] <- compute_marginal_loglik(weights_res$lbf_model,
                                                          data$n, nig_ss$yy,
                                                          params$alpha0,
                                                          params$beta0, TRUE)
    }
    return(model)
  } else {
    return(weights_res$lbf_model)
  }
}

#' @keywords internal
neg_loglik.ss <- function(data, params, model, V_param, ser_stats, ...)
{
  # Objective for prior-variance optimization: negative SER log-likelihood
  # as a function of V (possibly parameterized on the log scale).
  # Convert parameter to V based on optimization scale.
  V <- if (ser_stats$optim_scale == "log") exp(V_param) else V_param
  if (params$unmappable_effects == "inf") {
    # SuSiE-inf: Omega-weighted objective with logSumExp trick
    # Apply finite-reference R inflation: effective pw = pw / inflation
    pw <- model$predictor_weights
    infl <- if (!is.null(model$shat2_inflation)) model$shat2_inflation else 1
    # sqrt(.Machine$double.eps) guards log(0) when a prior weight is zero.
    return(-matrixStats::logSumExp(
      -0.5 * log(1 + V * pw / infl) +
        V * model$residuals^2 / (2 * infl * (1 + V * pw / infl)) +
        log(model$pi + sqrt(.Machine$double.eps))
    ))
  } else {
    # Standard SuSiE and SuSiE-ash: standard objective
    lbf_model <- loglik.ss(data, params, model, V, ser_stats)
    return(-lbf_model)
  }
}

# =============================================================================
# MODEL UPDATES & FITTING
#
# Functions for iterative model updates and variance component estimation.
# These handle the dynamic aspects of model fitting including fitted value
# updates and variance component estimation.
#
# Functions: update_fitted_values, update_variance_components,
#            update_derived_quantities
# =============================================================================

# Update fitted values (X'X r) after refitting single effect l.
#' @keywords internal
update_fitted_values.ss <- function(data, params, model, l, ...)
{
  sw_l <- get_slot_weight(model, l)
  if (params$unmappable_effects == "inf") {
    # SuSiE-inf: include theta (infinitesimal effects) in fitted values;
    # recompute from all slots rather than incrementally.
    sw <- if (!is.null(model$slot_weights)) model$slot_weights
          else rep(1, nrow(model$alpha))
    model$XtXr <- as.vector(compute_Rv(data,
      colSums(sw * model$alpha * model$mu) + model$theta))
  } else {
    # Standard SuSiE and SuSiE-ash: sparse component only; incremental update
    # adds slot l's contribution back onto the leave-l-out fitted values.
    model$XtXr <- model$fitted_without_l +
      sw_l * as.vector(compute_Rv(data, model$alpha[l, ] * model$mu[l, ]))
  }
  return(model)
}

# Update variance components for ss data
#' @keywords internal
update_variance_components.ss <- function(data, params, model, ...)
{
  # Dispatch on the unmappable-effects mode; returns a list of updated
  # variance components (or delegates to a mode-specific updater).
  if (params$unmappable_effects == "inf") {
    # Calculate omega: L x p matrix of per-slot, per-variable precisions,
    # diag(X'Omega X) + 1/V_l.
    L <- nrow(model$alpha)
    omega_res <- compute_omega_quantities(data, model$tau2, model$sigma2)
    omega <- matrix(rep(omega_res$diagXtOmegaX, L), nrow = L, ncol = data$p,
                    byrow = TRUE) +
      matrix(rep(1 / model$V, data$p), nrow = L, ncol = data$p, byrow = FALSE)
    # Compute theta (BLUP) for infinitesimal effects.
    theta <- compute_theta_blup(data, model)
    # Sigma2 and tau2 update: MLE or method-of-moments.
    if (params$estimate_residual_method == "MLE") {
      mle_result <- mle_unmappable(data, params, model, omega)
      return(list(sigma2 = mle_result$sigma2, tau2 = mle_result$tau2,
                  theta = theta))
    } else {
      mom_result <- mom_unmappable(data, params, model, omega, model$tau2)
      return(list(sigma2 = mom_result$sigma2, tau2 = mom_result$tau2,
                  theta = theta))
    }
  } else if (params$unmappable_effects == "ash_filter_archived") {
    # Original filter-based masking (archived for internal diagnostics)
    return(update_ash_variance_components_filter_archived(data, model, params))
  } else if (params$unmappable_effects == "ash") {
    # c_hat + 3 LD-interference heuristics
    return(update_ash_variance_components(data, model, params))
  } else {
    # Use default method for standard SuSiE
    return(update_variance_components.default(data, params, model))
  }
}

# Update derived quantities for ss data. For SuSiE-inf this refreshes the
# Omega-dependent quantities and the fitted values (including theta);
# otherwise it delegates to the default method.
#' @keywords internal
update_derived_quantities.ss <- function(data, params, model)
{
  if (params$unmappable_effects == "inf") {
    # Update omega quantities for next iteration
    omega_res <- compute_omega_quantities(data, model$tau2, model$sigma2)
    model$omega_var <- omega_res$omega_var
    model$predictor_weights <- omega_res$diagXtOmegaX
    model$XtOmegay <- data$eigen_vectors %*% (data$VtXty / omega_res$omega_var)
    # Update fitted values to include theta
    b <- colSums(model$alpha * model$mu)
    model$XtXr <- compute_Rv(data, b + model$theta)
    return(model)
  } else {
    return(update_derived_quantities.default(data, params, model))
  }
}

# =============================================================================
# OUTPUT
GENERATION & POST-PROCESSING
#
# Functions for generating final results and summary statistics.
# These process fitted models into interpretable outputs including
# credible sets, variable names, and fitted values.
#
# Functions: get_scale_factors, get_intercept, get_fitted, get_cs,
#            get_variable_names, get_zscore
# =============================================================================

# Get column scale factors recorded by scale() on XtX (or X, low-rank path).
#' @keywords internal
get_scale_factors.ss <- function(data, params)
{
  pm <- if (!is.null(data$XtX)) data$XtX else data$X
  # "scaled:scale" is set by base::scale() when standardization was applied.
  return(attr(pm, "scaled:scale"))
}

# Get intercept: y_mean minus the column-mean contribution of the fitted
# coefficients (rescaled back to the original X scale). NA when y_mean or
# X_colmeans were not supplied.
#' @keywords internal
get_intercept.ss <- function(data, params, model, ...)
{
  return(data$y_mean - sum(data$X_colmeans *
    (colSums(model$alpha * model$mu) / model$X_column_scale_factors)))
}

# Get Fitted Values (delegates to the default method).
#' @keywords internal
get_fitted.ss <- function(data, params, model, ...)
{
  return(get_fitted.default(data, params, model, ...))
}

# Get Credible Sets, with purity computed from XtX (converted to a
# correlation matrix when columns were not standardized) or from the
# low-rank factor X.
#' @keywords internal
get_cs.ss <- function(data, params, model, ...)
{
  if (is.null(params$coverage) || is.null(params$min_abs_corr)) {
    return(NULL)
  }
  if (!is.null(data$X)) {
    # Low-rank X path: data$X is B x p, columns are variables
    return(susie_get_cs(model, X = data$X, coverage = params$coverage,
                        min_abs_corr = params$min_abs_corr,
                        n_purity = params$n_purity))
  }
  # If diag(XtX) is not all 0/1, XtX is a covariance-like matrix; convert
  # to a correlation matrix before computing purity.
  if (any(!(diag(data$XtX) %in% c(0, 1)))) {
    Xcorr <- safe_cov2cor(data$XtX)
  } else {
    Xcorr <- data$XtX
  }
  return(susie_get_cs(model, Xcorr = Xcorr, check_symmetric = FALSE,
                      coverage = params$coverage,
                      min_abs_corr = params$min_abs_corr,
                      n_purity = params$n_purity))
}

# Get Variable Names from the column names of XtX (or X, low-rank path).
#' @keywords internal
get_variable_names.ss <- function(data, model, ...)
{
  pm <- if (!is.null(data$XtX)) data$XtX else data$X
  return(assign_names(data, model, colnames(pm)))
}

# Get univariate z-score
#' @keywords internal
get_zscore.ss <- function(data, params, model, ...)
{
  # Delegates to the default z-score computation.
  return(get_zscore.default(data, params, model))
}

# Clean up model object for sufficient statistics data: strip internal
# working fields before returning the fit to the user.
#' @keywords internal
cleanup_model.ss <- function(data, params, model, ...)
{
  # Remove common fields
  model <- cleanup_model.default(data, params, model, ...)

  # FIXME: for non-standard fields please connect them to "runtime_xx" where xx is unmappable effect option
  # Remove SS-specific fields for unmappable effects
  if (!is.null(params$unmappable_effects) &&
      params$unmappable_effects == "inf") {
    unmappable_fields <- c("omega_var", "XtOmegay")
    for (field in unmappable_fields) {
      if (field %in% names(model)) {
        model[[field]] <- NULL
      }
    }
  } else if (!is.null(params$unmappable_effects) &&
             params$unmappable_effects == "ash") {
    model <- cleanup_ash_fields(model)
  } else if (!is.null(params$unmappable_effects) &&
             params$unmappable_effects == "ash_filter_archived") {
    model <- cleanup_ash_fields_filter_archived(model)
  }

  # Remove NIG specific temporary fields
  if (params$use_NIG) {
    model$marginal_loglik <- NULL
  }
  return(model)
}


================================================
FILE: R/summary.susie.R
================================================
#' @title Summarize Susie Fit.
#'
#' @description \code{summary} method for the \dQuote{susie} class.
#'
#' @param object A susie fit.
#'
#' @param \dots Additional arguments passed to the generic \code{summary}
#' or \code{print.summary} method.
#'
#' @return \code{summary.susie} returns a list containing a data frame
#' of variables and a data frame of credible sets.
#'
#' @method summary susie
#'
#' @export summary.susie
#'
#' @export
#'
summary.susie <- function(object, ...)
{
  # Credible-set information is required to build the summary tables.
  if (is.null(object$sets)) {
    stop(
      "Cannot summarize SuSiE object because credible set information ",
      "is not available"
    )
  }
  # One row per variable: index, PIP, and CS membership (-1 = no CS).
  # seq_along() is safe on an empty pip vector, where 1:length() would
  # incorrectly yield c(1, 0).
  variables <- data.frame(cbind(seq_along(object$pip), object$pip, -1))
  colnames(variables) <- c("variable", "variable_prob", "cs")
  rownames(variables) <- NULL
  # Drop the null-weight pseudo-variable, if one was added to the model.
  if (object$null_index > 0) {
    variables <- variables[-object$null_index, ]
  }
  if (!is.null(object$sets$cs)) {
    # One row per credible set: index, log10 BF, and purity summaries.
    cs <- data.frame(matrix(NA, length(object$sets$cs), 5))
    colnames(cs) <- c("cs", "cs_log10bf", "cs_avg_r2", "cs_min_r2", "variable")
    for (i in seq_along(object$sets$cs)) {
      # Tag member variables with the credible set's index.
      variables$cs[variables$variable %in% object$sets$cs[[i]]] <-
        object$sets$cs_index[[i]]
      cs$cs[i] <- object$sets$cs_index[[i]]
      # Convert the effect's natural-log Bayes factor to log10 scale.
      cs$cs_log10bf[i] <- object$lbf[cs$cs[i]] / log(10)
      cs$cs_avg_r2[i] <- object$sets$purity$mean.abs.corr[i]^2
      cs$cs_min_r2[i] <- object$sets$purity$min.abs.corr[i]^2
      cs$variable[i] <- paste(object$sets$cs[[i]], collapse = ",")
    }
    variables <- variables[order(variables$variable_prob,
                                 decreasing = TRUE), ]
  } else {
    cs <- NULL
  }
  out <- list(vars = variables, cs = cs)
  class(out) <- c("summary.susie", "list")
  return(out)
}

#' @rdname summary.susie
#'
#' @param x A susie summary.
#'
#' @method print summary.susie
#'
#' @export print.summary.susie
#'
#' @export
#'
print.summary.susie <- function(x, ...)
{
  # Print only variables assigned to a credible set, then the CS table.
  message("\nVariables in credible sets:\n")
  print.data.frame(x$vars[which(x$vars$cs > 0), ], row.names = FALSE)
  message("\nCredible sets summary:\n")
  print.data.frame(x$cs, row.names = FALSE)
}


================================================
FILE: R/susie.R
================================================
# =============================================================================
# SuSiE WITH INDIVIDUAL-LEVEL DATA
# =============================================================================

#' @title Sum of Single Effects (SuSiE) Regression
#'
#' @description Performs a sparse Bayesian multiple linear regression
#' of y on X, using the "Sum of Single Effects" model from Wang et al
#' (2020).
In brief, this function fits the regression model \eqn{y = #' \mu + X b + e}, where elements of \eqn{e} are \emph{i.i.d.} normal #' with zero mean and variance \code{residual_variance}, \eqn{\mu} is #' an intercept term and \eqn{b} is a vector of length p representing #' the effects to be estimated. The \dQuote{susie assumption} is that #' \eqn{b = \sum_{l=1}^L b_l} where each \eqn{b_l} is a vector of #' length p with exactly one non-zero element. The prior on the #' non-zero element is normal with zero mean and variance \code{var(y) #' * scaled_prior_variance}. The value of \code{L} is fixed, and #' should be chosen to provide a reasonable upper bound on the number #' of non-zero effects to be detected. Typically, the hyperparameters #' \code{residual_variance} and \code{scaled_prior_variance} will be #' estimated during model fitting, although they can also be fixed as #' specified by the user. See functions \code{\link{susie_get_cs}} and #' other functions of form \code{susie_get_*} to extract the most #' commonly-used results from a susie fit. #' #' #' @details The function \code{susie} implements the IBSS algorithm #' from Wang et al (2020). The option \code{refine = TRUE} implements #' an additional step to help reduce problems caused by convergence of #' the IBSS algorithm to poor local optima (which is rare in our #' experience, but can provide misleading results when it occurs). The #' refinement step incurs additional computational expense that #' increases with the number of CSs found in the initial run. #' #' The function \code{susie_ss} implements essentially the same #' algorithms, but using sufficient statistics. (The statistics are #' sufficient for the regression coefficients \eqn{b}, but not for the #' intercept \eqn{\mu}; see below for how the intercept is treated.) 
#' If the sufficient statistics are computed correctly then the #' results from \code{susie_ss} should be the same as (or very #' similar to) \code{susie}, although runtimes will differ as #' discussed below. The sufficient statistics are the sample #' size \code{n}, and then the p by p matrix \eqn{X'X}, the p-vector #' \eqn{X'y}, and the sum of squared y values \eqn{y'y}, all computed #' after centering the columns of \eqn{X} and the vector \eqn{y} to #' have mean 0; these can be computed using \code{compute_suff_stat}. #' #' The handling of the intercept term in \code{susie_ss} needs #' some additional explanation. Computing the summary data after #' centering \code{X} and \code{y} effectively ensures that the #' resulting posterior quantities for \eqn{b} allow for an intercept #' in the model; however, the actual value of the intercept cannot be #' estimated from these centered data. To estimate the intercept term #' the user must also provide the column means of \eqn{X} and the mean #' of \eqn{y} (\code{X_colmeans} and \code{y_mean}). If these are not #' provided, they are treated as \code{NA}, which results in the #' intercept being \code{NA}. If for some reason you prefer to have #' the intercept be 0 instead of \code{NA} then set #' \code{X_colmeans = 0,y_mean = 0}. #' #' For completeness, we note that if \code{susie_ss} is run on #' \eqn{X'X, X'y, y'y} computed \emph{without} centering \eqn{X} and #' \eqn{y}, and with \code{X_colmeans = 0,y_mean = 0}, this is #' equivalent to \code{susie} applied to \eqn{X, y} with #' \code{intercept = FALSE} (although results may differ due to #' different initializations of \code{residual_variance} and #' \code{scaled_prior_variance}). However, this usage is not #' recommended for for most situations. 
#' #' The computational complexity of \code{susie} is \eqn{O(npL)} per #' iteration, whereas \code{susie_ss} is \eqn{O(p^2L)} per #' iteration (not including the cost of computing the sufficient #' statistics, which is dominated by the \eqn{O(np^2)} cost of #' computing \eqn{X'X}). Because of the cost of computing \eqn{X'X}, #' \code{susie} will usually be faster. However, if \eqn{n >> p}, #' and/or if \eqn{X'X} is already computed, then #' \code{susie_ss} may be faster. #' #' @param X An n by p matrix of covariates. #' #' @param y The observed responses, a vector of length n. #' #' @param L Maximum number of non-zero effects in the model. If L is larger than #' the number of covariates, p, L is set to p. #' #' @param scaled_prior_variance The prior variance, divided by #' \code{var(y)} (or by \code{(1/(n-1))yty} for #' \code{susie_ss}); that is, the prior variance of each #' non-zero element of b is \code{var(y) * scaled_prior_variance}. The #' value provided should be either a scalar or a vector of length #' \code{L}. If \code{estimate_prior_variance = TRUE}, this provides #' initial estimates of the prior variances. #' #' @param residual_variance Variance of the residual. If #' \code{estimate_residual_variance = TRUE}, this value provides the #' initial estimate of the residual variance. By default, it is set to #' \code{var(y)} in \code{susie} and \code{(1/(n-1))yty} in #' \code{susie_ss}. #' #' @param prior_weights A vector of length p, in which each entry #' gives the prior probability that corresponding column of X has a #' nonzero effect on the outcome, y. The weights are internally #' normalized to sum to 1. When \code{NULL} (the default), uniform #' prior weights are used (each variable is assigned probability #' \code{1/p}). #' #' @param null_weight Prior probability of no effect (a number between 0 and 1, #' and cannot be exactly 1). 
#' #' @param standardize If \code{standardize = TRUE}, standardize the #' columns of X to unit variance prior to fitting (or equivalently #' standardize XtX and Xty to have the same effect). Note that #' \code{scaled_prior_variance} specifies the prior on the #' coefficients of X \emph{after} standardization (if it is #' performed). If you do not standardize, you may need to think more #' carefully about specifying \code{scaled_prior_variance}. Whatever #' your choice, the coefficients returned by \code{coef} are given for #' \code{X} on the original input scale. Any column of \code{X} that #' has zero variance is not standardized. #' #' @param intercept If \code{intercept = TRUE}, the intercept is #' fitted; it \code{intercept = FALSE}, the intercept is set to #' zero. Setting \code{intercept = FALSE} is generally not #' recommended. #' #' @param estimate_residual_variance If #' \code{estimate_residual_variance = TRUE}, the residual variance is #' estimated, using \code{residual_variance} as an initial value. If #' \code{estimate_residual_variance = FALSE}, the residual variance is #' fixed to the value supplied by \code{residual_variance}. #' #' @param estimate_residual_method The method used for estimating residual variance. #' For the original SuSiE model, "MLE" and "MoM" estimation is equivalent, but for #' the infinitesimal model, "MoM" is more stable. We recommend using "NIG" #' when n < 80 for improved coverage, although it is currently only implemented #' for individual-level data. #' #' @param estimate_prior_variance If \code{estimate_prior_variance = #' TRUE}, the prior variance is estimated (this is a separate #' parameter for each of the L effects). If provided, #' \code{scaled_prior_variance} is then used as an initial value for #' the optimization. When \code{estimate_prior_variance = FALSE}, the #' prior variance for each of the L effects is determined by the #' value supplied to \code{scaled_prior_variance}. 
#' #' @param estimate_prior_method The method used for estimating prior #' variance. When \code{estimate_prior_method = "simple"} is used, the #' likelihood at the specified prior variance is compared to the #' likelihood at a variance of zero, and the setting with the larger #' likelihood is retained. When \code{prior_variance_grid} is provided, #' this is automatically set to \code{"fixed_mixture"}. #' #' @param prior_variance_grid Numeric vector of K prior variances defining #' a mixture-of-normals prior on effect sizes. When provided, the SER #' evaluates Bayes factors at each grid point and forms a mixture BF #' weighted by \code{mixture_weights}. This bypasses the scalar prior #' variance optimization. Default is \code{NULL} (standard scalar V path). #' #' @param mixture_weights Numeric vector of K non-negative weights summing #' to 1, giving the mixture proportions for the variance grid. Default is #' \code{NULL}, which uses uniform weights when \code{prior_variance_grid} #' is provided. #' #' @param unmappable_effects The method for modeling unmappable effects: #' "none", "inf", "ash". #' #' @param check_null_threshold When the prior variance is estimated, #' compare the estimate with the null, and set the prior variance to #' zero unless the log-likelihood using the estimate is larger by this #' threshold amount. For example, if you set #' \code{check_null_threshold = 0.1}, this will "nudge" the estimate #' towards zero when the difference in log-likelihoods is small. A #' note of caution that setting this to a value greater than zero may #' lead the IBSS fitting procedure to occasionally decrease the ELBO. This #' setting is disabled when using \code{unmappable_effects = "inf"} or #' \code{unmappable_effects = "ash"}. 
#' #' @param prior_tol When the prior variance is estimated, compare the #' estimated value to \code{prior_tol} at the end of the computation, #' and exclude a single effect from PIP computation if the estimated #' prior variance is smaller than this tolerance value. #' #' @param residual_variance_upperbound Upper limit on the estimated #' residual variance. It is only relevant when #' \code{estimate_residual_variance = TRUE}. #' #' @param model_init A previous susie fit with which to initialize. #' #' @param s_init Deprecated alias for \code{model_init}. #' #' @param coverage A number between 0 and 1 specifying the #' \dQuote{coverage} of the estimated confidence sets. #' #' @param min_abs_corr Minimum absolute correlation allowed in a #' credible set. The default, 0.5, corresponds to a squared #' correlation of 0.25, which is a commonly used threshold for #' genotype data in genetic studies. This "purity" filter is #' applied to the CSs reported in the fit object, so the CS list #' returned here may be a subset of the one produced by calling #' \code{\link{susie_get_cs}} on the same fit without passing #' \code{X} or \code{Xcorr} (in which case the purity filter is #' skipped). #' #' @param compute_univariate_zscore If \code{compute_univariate_zscore #' = TRUE}, the univariate regression z-scores are outputted for each #' variable. #' #' @param na.rm Drop any missing values in y from both X and y. #' #' @param max_iter Maximum number of IBSS iterations to perform. #' #' @param L_greedy Integer or \code{NULL}. When non-\code{NULL}, run a #' greedy outer loop that grows the number of effects from #' \code{L_greedy} up to \code{L} in linear steps until the fit #' saturates. The default \code{NULL} runs the usual fixed-\code{L} #' fit. #' #' @param greedy_lbf_cutoff Numeric saturation threshold for the #' \code{L_greedy} outer loop. Default is 0.1. 
@param tol A small, non-negative number specifying the convergence
#' tolerance for the IBSS fitting procedure.
#'
#' @param convergence_method When \code{convergence_method = "elbo"} the fitting
#' procedure halts when the difference in the variational lower bound, or
#' \dQuote{ELBO} (the objective function to be maximized), is
#' less than \code{tol}. When \code{convergence_method = "pip"} the fitting
#' procedure halts when the maximum absolute difference in \code{alpha} is less
#' than \code{tol}.
#' #' @param slot_prior Optional slot activity prior created by #' \code{\link{slot_prior_betabinom}} or \code{\link{slot_prior_poisson}}. #' Use \code{slot_prior_betabinom(a_beta, b_beta)} for the usual #' single-locus setting; it places a Beta-Binomial prior on the #' number of active effects and gives an adaptive multiplicity #' correction. Use \code{slot_prior_poisson(C, nu)} when you want a #' Gamma-Poisson prior centered on an expected number \code{C} of #' active effects. When supplied, each single-effect slot has an #' estimated activity probability \code{c_hat}; fitted values and #' PIPs are weighted by these activity probabilities, and convergence #' is checked using \code{convergence_method = "pip"}. #' #' @param init_only Logical. If \code{TRUE}, return a list with #' \code{data} and \code{params} objects without running the IBSS #' algorithm. Used by packages like susieAnn that implement their own #' outer loop around SuSiE's building blocks. Default is \code{FALSE}. #' #' @return A \code{"susie"} object with some or all of the following elements: #' #' \item{alpha}{An L by p matrix of posterior inclusion probabilities.} #' #' \item{mu}{An L by p matrix of posterior means, conditional on inclusion.} #' #' \item{mu2}{An L by p matrix of posterior second moments, conditional on #' inclusion.} #' #' \item{Xr}{A vector of length n, equal to \code{X \%*\% colSums(alpha * mu)}.} #' #' \item{lbf}{Log-Bayes Factor for each single effect.} #' #' \item{lbf_variable}{Log-Bayes Factor for each variable and single effect.} #' #' \item{intercept}{Intercept (fixed or estimated).} #' #' \item{sigma2}{Residual variance (fixed or estimated).} #' #' \item{V}{Prior variance of the non-zero elements of b.} #' #' \item{elbo}{The variational lower bound (or ELBO) achieved at each iteration.} #' #' \item{fitted}{Vector of length n containing the fitted values.} #' #' \item{sets}{Credible sets estimated from model fit.} #' #' \item{pip}{A vector of length p giving the marginal 
posterior inclusion
#' probabilities.}
#'
#' \item{z}{A vector of univariate z-scores.}
#'
#' \item{niter}{Number of IBSS iterations performed.}
#'
#' \item{converged}{\code{TRUE} or \code{FALSE} indicating whether
#' the IBSS converged to a solution within the chosen tolerance
#' level.}
#'
#' \item{theta}{If \code{unmappable_effects = "inf"} or
#' \code{unmappable_effects = "ash"}, then \code{theta} is a p-vector of posterior
#' means for the unmappable effects.}
#'
#' \item{tau2}{If \code{unmappable_effects = "inf"} or
#' \code{unmappable_effects = "ash"}, then \code{tau2} is the unmappable variance.}
#'
#' @importFrom stats var
#'
#' @export
#'
susie <- function(X, y, L = min(10, ncol(X)),
                  scaled_prior_variance = 0.2,
                  residual_variance = NULL,
                  prior_weights = NULL,
                  null_weight = 0,
                  standardize = TRUE,
                  intercept = TRUE,
                  estimate_residual_variance = TRUE,
                  estimate_residual_method = c("MoM", "MLE", "NIG"),
                  estimate_prior_variance = TRUE,
                  estimate_prior_method = c("optim", "EM", "simple"),
                  prior_variance_grid = NULL,
                  mixture_weights = NULL,
                  unmappable_effects = c("none", "inf", "ash",
                                         "ash_filter_archived"),
                  check_null_threshold = 0,
                  prior_tol = 1e-9,
                  residual_variance_upperbound = Inf,
                  model_init = NULL,
                  s_init = NULL,
                  coverage = 0.95,
                  min_abs_corr = 0.5,
                  compute_univariate_zscore = FALSE,
                  na.rm = FALSE,
                  max_iter = 100,
                  L_greedy = NULL,
                  greedy_lbf_cutoff = 0.1,
                  tol = 1e-4,
                  convergence_method = c("elbo", "pip"),
                  verbose = FALSE,
                  track_fit = FALSE,
                  residual_variance_lowerbound = NULL,
                  refine = FALSE,
                  n_purity = 100,
                  alpha0 = 1/sqrt(nrow(X)),
                  beta0 = 1/sqrt(nrow(X)),
                  init_only = FALSE,
                  slot_prior = NULL)
{
  # Validate method arguments
  unmappable_effects <- match.arg(unmappable_effects)
  estimate_residual_method <- match.arg(estimate_residual_method)
  convergence_method <- match.arg(convergence_method)
  # Resolve the prior-variance configuration (scalar V vs mixture grid);
  # this may override the prior method/variance settings.
  mp <- resolve_mixture_prior(estimate_prior_method, estimate_prior_variance,
                              prior_variance_grid, mixture_weights)
  estimate_prior_method <- mp$estimate_prior_method
  estimate_prior_variance <- mp$estimate_prior_variance
  prior_variance_grid <- mp$prior_variance_grid
  mixture_weights <- mp$mixture_weights

  # See vignette "finemapping_summary_statistics" for the recommended workflow
  if (verbose && nrow(X) >= 2 * ncol(X)) {
    warning_message(
      "nrow(X) = ", nrow(X), " >= 2 * ncol(X) = ", 2 * ncol(X), ". ",
      "Consider precomputing sufficient statistics with compute_suff_stat() ",
      "and fitting with susie_ss() instead -- this avoids holding X in ",
      "memory at every iteration and lets you reuse XtX across multiple y.",
      style = "hint"
    )
  }

  # Construct data and params objects
  susie_objects <- individual_data_constructor(
    X, y, L, scaled_prior_variance, residual_variance, prior_weights,
    null_weight, standardize, intercept, estimate_residual_variance,
    estimate_residual_method, estimate_prior_variance, estimate_prior_method,
    prior_variance_grid, mixture_weights, unmappable_effects,
    check_null_threshold, prior_tol, residual_variance_upperbound,
    model_init, s_init, coverage, min_abs_corr, compute_univariate_zscore,
    na.rm, max_iter, tol, convergence_method, verbose, track_fit,
    residual_variance_lowerbound, refine, n_purity, alpha0, beta0,
    slot_prior, L_greedy, greedy_lbf_cutoff
  )

  # Return data and params without fitting if init_only is TRUE.
  # The caller is responsible for calling ibss_initialize() on these.
  if (init_only) {
    return(susie_objects)
  }

  # Run main SuSiE algorithm
  model <- susie_workhorse(susie_objects$data, susie_objects$params)
  return(model)
}

# =============================================================================
# SuSiE WITH SUFFICIENT STATISTICS
# =============================================================================

#' @title SuSiE using Sufficient Statistics
#'
#' @inheritParams susie
#'
#' @description Performs SuSiE regression using sufficient statistics (XtX, Xty,
#' yty, n) instead of individual-level data (X, y).
#'
#' @param XtX A p by p matrix, X'X, with columns of X centered to have mean zero.
#' #' @param Xty A p-vector, X'y, with y and columns of X centered to have mean zero. #' #' @param yty A scalar, y'y, with y centered to have mean zero. #' #' @param n The sample size. #' #' @param X_colmeans A p-vector of column means of \code{X}. If both #' \code{X_colmeans} and \code{y_mean} are provided, the intercept #' is estimated; otherwise, the intercept is NA. #' #' @param y_mean A scalar containing the mean of \code{y}. If both #' \code{X_colmeans} and \code{y_mean} are provided, the intercept #' is estimated; otherwise, the intercept is NA. #' #' @param maf A p-vector of minor allele frequencies; to be used along with #' \code{maf_thresh} to filter input summary statistics. #' #' @param maf_thresh Variants with MAF smaller than this threshold are not used. #' #' @param check_input If \code{check_input = TRUE}, \code{susie_ss} performs #' additional checks on \code{XtX} and \code{Xty}. The checks are: #' (1) check that \code{XtX} is positive semidefinite; (2) check that #' \code{Xty} is in the space spanned by the non-zero eigenvectors of \code{XtX}. #' #' @param r_tol Tolerance level for eigenvalue check of positive semidefinite #' matrix \code{XtX}. #' #' @param check_prior If \code{check_prior = TRUE}, it checks if the #' estimated prior variance becomes unreasonably large (comparing with #' 10 * max(abs(z))^2). 
#'
#' @export
#'
susie_ss <- function(XtX, Xty, yty, n, L = min(10, ncol(XtX)),
                     X_colmeans = NA, y_mean = NA,
                     maf = NULL,
                     maf_thresh = 0,
                     check_input = FALSE,
                     r_tol = 1e-8,
                     standardize = TRUE,
                     scaled_prior_variance = 0.2,
                     residual_variance = NULL,
                     prior_weights = NULL,
                     null_weight = 0,
                     model_init = NULL,
                     s_init = NULL,
                     estimate_residual_variance = TRUE,
                     estimate_residual_method = c("MoM", "MLE", "NIG"),
                     residual_variance_lowerbound = 0,
                     residual_variance_upperbound = Inf,
                     estimate_prior_variance = TRUE,
                     estimate_prior_method = c("optim", "EM", "simple"),
                     prior_variance_grid = NULL,
                     mixture_weights = NULL,
                     unmappable_effects = c("none", "inf", "ash",
                                            "ash_filter_archived"),
                     check_null_threshold = 0,
                     prior_tol = 1e-9,
                     max_iter = 100,
                     L_greedy = NULL,
                     greedy_lbf_cutoff = 0.1,
                     tol = 1e-4,
                     convergence_method = c("elbo", "pip"),
                     coverage = 0.95,
                     min_abs_corr = 0.5,
                     n_purity = 100,
                     verbose = FALSE,
                     track_fit = FALSE,
                     check_prior = FALSE,
                     refine = FALSE,
                     alpha0 = 1/sqrt(n),
                     beta0 = 1/sqrt(n),
                     slot_prior = NULL)
{
  # Validate method arguments
  unmappable_effects <- match.arg(unmappable_effects)
  estimate_residual_method <- match.arg(estimate_residual_method)
  convergence_method <- match.arg(convergence_method)
  # Resolve the prior-variance configuration (scalar V vs mixture grid);
  # this may override the prior method/variance settings.
  mp <- resolve_mixture_prior(estimate_prior_method, estimate_prior_variance,
                              prior_variance_grid, mixture_weights)
  estimate_prior_method <- mp$estimate_prior_method
  estimate_prior_variance <- mp$estimate_prior_variance
  prior_variance_grid <- mp$prior_variance_grid
  mixture_weights <- mp$mixture_weights

  # Construct data and params objects
  susie_objects <- sufficient_stats_constructor(
    Xty = Xty, yty = yty, n = n, XtX = XtX, L = L,
    X_colmeans = X_colmeans, y_mean = y_mean,
    maf = maf, maf_thresh = maf_thresh,
    check_input = check_input, r_tol = r_tol,
    standardize = standardize,
    scaled_prior_variance = scaled_prior_variance,
    residual_variance = residual_variance,
    prior_weights = prior_weights, null_weight = null_weight,
    model_init = model_init, s_init = s_init,
    estimate_residual_variance = estimate_residual_variance,
    estimate_residual_method = estimate_residual_method,
    residual_variance_lowerbound = residual_variance_lowerbound,
    residual_variance_upperbound = residual_variance_upperbound,
    estimate_prior_variance = estimate_prior_variance,
    estimate_prior_method = estimate_prior_method,
    prior_variance_grid = prior_variance_grid,
    mixture_weights = mixture_weights,
    unmappable_effects = unmappable_effects,
    check_null_threshold = check_null_threshold,
    prior_tol = prior_tol,
    max_iter = max_iter, tol = tol,
    convergence_method = convergence_method,
    coverage = coverage, min_abs_corr = min_abs_corr,
    n_purity = n_purity,
    verbose = verbose, track_fit = track_fit,
    check_prior = check_prior, refine = refine,
    alpha0 = alpha0, beta0 = beta0,
    slot_prior = slot_prior, L_greedy = L_greedy,
    greedy_lbf_cutoff = greedy_lbf_cutoff
  )

  # Run main SuSiE algorithm
  model <- susie_workhorse(susie_objects$data, susie_objects$params)
  return(model)
}

# =============================================================================
# SuSiE WITH REGRESSION SUMMARY STATISTICS
# =============================================================================

#' @title SuSiE with Regression Summary Statistics (RSS)
#'
#' @inheritParams susie_ss
#'
#' @description Performs SuSiE regression using z-scores and correlation matrix.
#' This is the sufficient-statistics RSS interface. For the specialized
#' regularized eigendecomposition likelihood with \code{lambda > 0}, use
#' \code{\link{susie_rss_lambda}}.
#'
#' @param z A p-vector of z-scores.
#'
#' @param R A p by p correlation matrix. Exactly one of \code{R} or
#' \code{X} must be provided.
#'
#' @param n The sample size, not required but recommended.
#'
#' @param X A factor matrix (B x p) such that \code{R = crossprod(X) /
#' nrow(X)} approximates the R (correlation) matrix. When
#' \code{nrow(X) >= ncol(X)}, the correlation matrix \code{R} is
#' formed explicitly and the standard path is used.
When #' \code{nrow(X) < ncol(X)}, a low-rank path is used that avoids #' forming the p x p matrix, reducing per-iteration cost from #' O(Lp^2) to O(LBp). Columns of \code{X} are standardized #' internally. #' #' @param bhat Alternative summary data giving the estimated effects #' (a vector of length p). This, together with \code{shat}, may be #' provided instead of \code{z}. #' #' @param shat Alternative summary data giving the standard errors of #' the estimated effects (a vector of length p). This, together with #' \code{bhat}, may be provided instead of \code{z}. #' #' @param var_y The sample variance of y, defined as \eqn{y'y/(n-1)}. #' When the sample variance is not provided, the coefficients #' (returned from \code{coef}) are computed on the #' \dQuote{standardized} X, y scale. #' #' @param estimate_residual_variance The default is FALSE, the #' residual variance is fixed to 1 or variance of y. If the in-sample #' R matrix is provided, we recommend setting #' \code{estimate_residual_variance = TRUE}. #' #' @param R_finite Controls variance inflation to account #' for estimating the R matrix from a finite reference panel. Accepts three #' types of input: #' \describe{ #' \item{\code{NULL} (default)}{The R matrix is treated as trusted, and no #' finite-reference variance inflation is applied.} #' \item{\code{TRUE}}{Infer the reference sample size B from the input #' \code{X}. Sets \code{B = nrow(X)} for single-panel input, #' or \code{B = min(nrow(X_k))} across panels for multi-panel #' input. Requires \code{X} to be provided (errors if only #' \code{R} is given, since B cannot be inferred).} #' \item{Number}{Explicit reference sample size B.} #' } #' When active, this dynamically inflates the null variance of each #' variable's score statistic at every IBSS iteration to account for #' finite-reference uncertainty in the Single Effect Regression (SER). 
#' When provided, the output includes a #' \code{R_finite_diagnostics} element with per-region and #' per-variable quality metrics. #' #' @param R_mismatch R-bias correction mode. \code{"none"} (default) is off. #' \code{"map"} adds a region-level population-mismatch variance #' component on top of the finite-reference correction; recommended #' whenever \code{R} comes from a different cohort than the GWAS. #' \code{"map_qc"} is \code{"map"} plus a QC score (\code{Q_art}) that #' warns when the fitted residual carries energy in directions where #' the supplied \code{R} indicates signal should be weak. For #' allele-coding / strand-flip checks, see the kriging diagnostic in #' \code{susie_rss}'s companion utilities. #' Requires \code{R_finite}; auto-disables \code{estimate_residual_variance} #' with a warning. #' #' @param eig_delta_rel,eig_delta_abs Cutoffs for "low-eigenvalue" #' directions of \code{R} used by the QC diagnostic #' (\code{R_mismatch = "map_qc"}). Default \code{eig_delta_rel = 1e-3}, #' \code{eig_delta_abs = 0}; the threshold is #' \code{max(eig_delta_abs, eig_delta_rel * max_eigenvalue(R))}. Tighter #' (smaller) values flag fewer regions. #' #' @param artifact_threshold Flag threshold on the QC score \code{Q_art} #' (a fraction in [0, 1]). Default \code{0.1}; flag fires when #' \code{Q_art > artifact_threshold}. Heuristic, not a calibrated test. #' #' @param init_only Logical. If \code{TRUE}, return a list with #' \code{data} and \code{params} objects without running the IBSS #' algorithm. Default is \code{FALSE}. 
#'
#' @return In addition to the standard \code{"susie"} output (see
#' \code{\link{susie}}), the returned object may contain:
#'
#' \item{R_finite_diagnostics}{A list of diagnostics for the
#' finite-reference correction (only present when
#' \code{R_finite} is provided), containing:
#' \code{B} (the reference sample size);
#' \code{p} (number of variables);
#' \code{effective_rank} (debiased \eqn{\tilde{r} = p^2 / \|R\|_F^2});
#' \code{r_over_B} (\eqn{\tilde{r}/B}, one number per region; values
#' \eqn{\le 0.2} indicate the reference panel is adequate);
#' \code{Rhat_diag_deviation} (\eqn{|\hat{R}_{jj} - 1|}, one number
#' per variable);
#' \code{lambda_bias} (region-level scalar on the default
#' \code{lambda = 0} sufficient-statistics path when
#' \code{R_mismatch != "none"});
#' \code{B_corrected} (effective reference sample size after the
#' R-bias correction, \eqn{1/(1/B + \lambda_{\mathrm{bias}})};
#' substantially smaller than the input \code{B} flags a dominant
#' population mismatch component);
#' \code{per_variable_penalty} (final-iteration
#' \eqn{v_j / \sigma^2 = \tau_j^2 / \sigma^2 - 1}, one number per
#' variable; values \eqn{\le 0.2} indicate minimal power loss,
#' values \eqn{\gg 1} flag variables where the correction is doing
#' heavy lifting).}
#'
#' \item{single_panel_fits}{In multi-panel mode, the per-panel
#' single-panel fits used to choose the mixture initialization.}
#'
#' @export
#'
susie_rss <- function(z = NULL, R = NULL, n = NULL, X = NULL, bhat = NULL,
                      shat = NULL, var_y = NULL,
                      L = min(10, if (is.list(R) && !is.matrix(R)) ncol(R[[1]])
                              else if (!is.null(R)) ncol(R)
                              else if (is.list(X) && !is.matrix(X)) ncol(X[[1]])
                              else ncol(X)),
                      maf = NULL, maf_thresh = 0, scaled_prior_variance = 0.2,
                      residual_variance = NULL, prior_weights = NULL,
                      null_weight = 0, standardize = TRUE,
                      estimate_residual_variance = FALSE,
                      estimate_residual_method = c("MoM", "MLE", "NIG"),
                      estimate_prior_variance = TRUE,
                      estimate_prior_method = c("optim", "EM", "simple"),
                      prior_variance_grid = NULL, mixture_weights = NULL,
                      unmappable_effects = c("none", "inf", "ash",
                                             "ash_filter_archived"),
                      check_null_threshold = 0, prior_tol = 1e-9,
                      residual_variance_lowerbound = 0,
                      residual_variance_upperbound = Inf,
                      model_init = NULL, s_init = NULL, coverage = 0.95,
                      min_abs_corr = 0.5, max_iter = 100, L_greedy = NULL,
                      greedy_lbf_cutoff = 0.1, tol = 1e-4,
                      convergence_method = c("elbo", "pip"),
                      verbose = FALSE, track_fit = FALSE,
                      check_input = FALSE, check_prior = TRUE,
                      n_purity = 100, r_tol = 1e-8, refine = FALSE,
                      R_finite = NULL,
                      R_mismatch = c("none", "map", "map_qc"),
                      eig_delta_rel = 1e-3, eig_delta_abs = 0,
                      artifact_threshold = 0.1,
                      alpha0 = if (is.null(n)) NULL else 1/sqrt(n),
                      beta0 = if (is.null(n)) NULL else 1/sqrt(n),
                      init_only = FALSE, slot_prior = NULL) {

  # Validate: exactly one of R or X must be provided.
  if (is.null(R) && is.null(X))
    stop("Please provide either R (correlation matrix) or X (factor matrix).")
  if (!is.null(R) && !is.null(X))
    stop("Please provide either R or X, but not both.")
  is_multi_panel <- (is.list(X) && !is.matrix(X)) ||
    (is.list(R) && !is.matrix(R))

  R_mismatch <- match.arg(R_mismatch)
  if (!is.numeric(eig_delta_rel) || length(eig_delta_rel) != 1L ||
      eig_delta_rel < 0)
    stop("eig_delta_rel must be a single nonnegative numeric.")
  if (!is.numeric(eig_delta_abs) || length(eig_delta_abs) != 1L ||
      eig_delta_abs < 0)
    stop("eig_delta_abs must be a single nonnegative numeric.")
  if (!is.numeric(artifact_threshold) || length(artifact_threshold) != 1L ||
      artifact_threshold < 0 || artifact_threshold > 1)
    stop("artifact_threshold must be a single numeric in [0, 1].")

  # Resolve R_finite BEFORE any X -> R conversion.
  if (isTRUE(R_finite) && is.null(X))
    stop("R_finite = TRUE requires X input. When using precomputed R, ",
         "provide the reference sample size explicitly.")
  R_finite <- resolve_R_finite(R_finite, if (!is.null(X)) X else R,
                               is_multi_panel)
  if (R_mismatch != "none" && is.null(R_finite))
    stop("R_mismatch requires R_finite because lambda_bias is estimated ",
         "as extra R bias beyond finite-reference uncertainty.")

  # sigma^2 and lambda_bias both inflate the residual variance and are
  # only weakly jointly identified; we follow Zou et al. (2022) and fix
  # sigma^2 when R_mismatch is active.
  if (R_mismatch != "none" && isTRUE(estimate_residual_variance)) {
    warning_message(
      "R_mismatch = '", R_mismatch, "' is incompatible with ",
      "estimate_residual_variance = TRUE; disabling sigma^2 estimation."
    )
    estimate_residual_variance <- FALSE
  }

  # Per-panel single-panel fits and their final ELBOs, populated only in
  # multi-panel mode. BUG FIX: these were previously locals of the
  # pick_init_panel() helper, so the exists("sp_fits") check at the end
  # of this function never found them in this frame (and, with the
  # default inherits = TRUE, could even pick up an unrelated object from
  # the global environment); model$single_panel_fits was never set. The
  # helper now returns them explicitly.
  sp_fits <- NULL
  sp_elbos <- NULL

  # Multi-panel: shared validation, PIP-switch, and per-panel sub-fit
  # machinery. The R-input and X-input branches differ only in (i) what
  # "valid" means for an element and (ii) whether the panels need
  # centering. They share everything else: the n requirement, the
  # PIP-convergence switch, and the per-panel single-panel sub-fits used
  # to pick the best mixture init via attr(., ".init_panel").
  if (is_multi_panel) {
    if (is.null(n))
      stop("Sample size 'n' is required for multi-panel mode.")
    if (convergence_method[1] == "elbo") {
      convergence_method <- "pip"
      warning_message("Switching to PIP-based convergence for multi-panel mixture ",
                      "as mixture weights updates change R(omega) each iteration, which prevents ",
                      "ELBO monotonicity.")
    }

    # Capture the user's call frame here so the per-panel recursive call
    # can resolve any unevaluated arguments in the original caller env.
    user_env <- parent.frame()
    sp_call <- match.call()
    sp_call[[1]] <- quote(susie_rss)
    sp_call$verbose <- FALSE
    sp_call$s_init <- NULL
    sp_call$model_init <- NULL

    # Fits susie_rss to each panel separately and returns the fits, their
    # final ELBOs, and the index of the panel with the highest ELBO.
    # `panel_arg` selects which call slot to substitute ("R" or "X").
    pick_init_panel <- function(panels, panel_arg) {
      fits <- lapply(seq_along(panels), function(k) {
        sp_call[[panel_arg]] <- panels[[k]]
        sp_call$R_finite <- if (is.null(R_finite)) NULL else R_finite[k]
        tryCatch(eval(sp_call, user_env), error = function(e) NULL)
      })
      elbos <- vapply(fits,
                      function(f) if (!is.null(f)) tail(f$elbo, 1) else -Inf,
                      numeric(1))
      list(best = which.max(elbos), fits = fits, elbos = elbos)
    }

    if (!is.null(R)) {
      for (k in seq_along(R)) {
        if (!is.matrix(R[[k]]) || !is.numeric(R[[k]]))
          stop("Each element of R list must be a numeric matrix.")
        if (nrow(R[[k]]) != ncol(R[[k]]))
          stop("Each element of R list must be square.")
      }
      panel_sel <- pick_init_panel(R, "R")
      sp_fits <- panel_sel$fits
      sp_elbos <- panel_sel$elbos
      attr(R, ".init_panel") <- panel_sel$best
    } else {
      for (k in seq_along(X)) {
        if (!is.matrix(X[[k]]) || !is.numeric(X[[k]]))
          stop("Each element of X list must be a numeric matrix.")
      }
      # Center each panel before sub-fits so that crossprod(Xk) gives a
      # covariance-like quantity, matching the ss_mixture_constructor's
      # downstream expectation.
      X <- lapply(X, function(Xk) {
        cm <- colMeans(Xk)
        if (max(abs(cm)) > 1e-10 * max(abs(Xk)))
          Xk <- t(t(Xk) - cm)
        Xk
      })
      panel_sel <- pick_init_panel(X, "X")
      sp_fits <- panel_sel$fits
      sp_elbos <- panel_sel$elbos
      attr(X, ".init_panel") <- panel_sel$best
    }
  }

  # Handle single-panel X input.
  if (!is.null(X) && !is_multi_panel) {
    if (!is.matrix(X) || !is.numeric(X))
      stop("X must be a numeric matrix.")

    # Center columns of X so that crossprod gives covariance-like quantities.
    cm <- colMeans(X)
    if (max(abs(cm)) > 1e-10 * max(abs(X)))
      X <- t(t(X) - cm)

    # Features incompatible with the low-rank path: fall back to forming R.
    needs_R <- !is.null(var_y) && !is.null(shat)
    if (needs_R && nrow(X) < ncol(X)) {
      warning_message(
        "X is provided as a low-rank factor matrix, but var_y/shat ",
        "requires the full correlation matrix R. Forming ",
        "R = cov2cor(crossprod(X)/nrow(X)) and using the standard path.")
    }

    # If nrow(X) >= ncol(X) or features require R, form R and use the
    # standard (full-matrix) path.
    if (nrow(X) >= ncol(X) || needs_R) {
      R <- safe_cor(X)
      X <- NULL
    }
  }

  # Validate method arguments.
  unmappable_effects <- match.arg(unmappable_effects)
  estimate_residual_method <- match.arg(estimate_residual_method)
  convergence_method <- match.arg(convergence_method)
  mp <- resolve_mixture_prior(estimate_prior_method, estimate_prior_variance,
                              prior_variance_grid, mixture_weights)
  estimate_prior_method <- mp$estimate_prior_method
  estimate_prior_variance <- mp$estimate_prior_variance
  prior_variance_grid <- mp$prior_variance_grid
  mixture_weights <- mp$mixture_weights

  # Auto-switch to PIP convergence for finite-reference R inflation.
  # (R_finite was already resolved to an integer above.)
  if (!is.null(R_finite) && convergence_method[1] == "elbo") {
    convergence_method <- "pip"
    warning_message("Switching to PIP-based convergence because finite-reference R inflation ",
                    "modifies per-variant SER likelihoods which prevents a consistent model-level ELBO.")
  }

  # Construct data and params objects with ALL parameters.
  susie_objects <- summary_stats_constructor(
    z = z, R = R, X = X, n = n, bhat = bhat, shat = shat, var_y = var_y,
    L = L, maf = maf, maf_thresh = maf_thresh,
    scaled_prior_variance = scaled_prior_variance,
    residual_variance = residual_variance, prior_weights = prior_weights,
    null_weight = null_weight, standardize = standardize,
    estimate_residual_variance = estimate_residual_variance,
    estimate_residual_method = estimate_residual_method,
    estimate_prior_variance = estimate_prior_variance,
    estimate_prior_method = estimate_prior_method,
    prior_variance_grid = prior_variance_grid,
    mixture_weights = mixture_weights,
    unmappable_effects = unmappable_effects,
    check_null_threshold = check_null_threshold, prior_tol = prior_tol,
    residual_variance_lowerbound = residual_variance_lowerbound,
    residual_variance_upperbound = residual_variance_upperbound,
    model_init = model_init, s_init = s_init, coverage = coverage,
    min_abs_corr = min_abs_corr, max_iter = max_iter, tol = tol,
    convergence_method = convergence_method, verbose = verbose,
    track_fit = track_fit, check_input = check_input,
    check_prior = check_prior, n_purity = n_purity, r_tol = r_tol,
    refine = refine, R_finite = R_finite, R_mismatch = R_mismatch,
    eig_delta_rel = eig_delta_rel, eig_delta_abs = eig_delta_abs,
    artifact_threshold = artifact_threshold, alpha0 = alpha0,
    beta0 = beta0, slot_prior = slot_prior, L_greedy = L_greedy,
    greedy_lbf_cutoff = greedy_lbf_cutoff
  )

  # Return constructed data and params without running IBSS (for susieAnn
  # and other packages that implement their own outer loop). The caller
  # is responsible for calling ibss_initialize() on the returned objects.
  if (init_only) {
    return(susie_objects)
  }

  # Run main SuSiE algorithm.
  model <- susie_workhorse(susie_objects$data, susie_objects$params)

  # Store single-panel fits inside the mixture result so users can compare.
  # Always return the mixture result; users can choose a single-panel fit
  # from model$single_panel_fits if they prefer.
  if (!is.null(sp_fits)) {
    if (verbose) {
      mix_elbo <- tail(model$elbo, 1)
      best_k <- which.max(sp_elbos)
      omega_str <- paste(round(model$omega_weights, 3), collapse = ", ")
      message(sprintf(
        "Multi-panel: mixture ELBO = %.2f (omega = %s), best single-panel ELBO = %.2f (panel %d).",
        mix_elbo, omega_str, sp_elbos[best_k], best_k))
    }
    model$single_panel_fits <- sp_fits
  }
  return(model)
}

#' Sum of Single Effects Regression using the RSS-lambda likelihood
#'
#' @description Specialized interface for the regularized eigendecomposition
#' RSS likelihood of Zou et al. (2022). This path accepts a single reference
#' matrix or a single factor matrix and does not support multi-panel mixture,
#' finite-reference inflation, or R-bias correction.
#' #' @inheritParams susie_rss #' #' @param lambda Regularization parameter for the RSS-lambda likelihood. #' Must be supplied. \code{lambda = "estimate"} estimates lambda from #' the null-space residual. #' @param prior_variance Prior variance for each non-zero effect on the #' z-score scale. Replaces \code{scaled_prior_variance} from #' \code{\link{susie_rss}}. Default \code{50}. #' @param intercept_value Intercept used by the RSS-lambda likelihood. #' Default \code{0}. #' @param estimate_residual_method Variance-component estimator. The #' RSS-lambda path supports \code{"MLE"} only; any other value errors. #' @param estimate_prior_variance If \code{estimate_prior_variance = TRUE}, #' the prior variance is estimated (a separate parameter for each of #' the L effects). When \code{TRUE}, \code{prior_variance} provides the #' initial value; when \code{FALSE}, it is held fixed. #' @param check_null_threshold When the prior variance is estimated, #' compare its likelihood to the likelihood at zero and use zero #' unless the larger value exceeds it by at least #' \code{check_null_threshold}. \code{0} (default) takes the larger #' likelihood at face value. #' @param check_R If TRUE, verify that \code{R} is positive semidefinite. #' @param check_z If TRUE, verify that \code{z} lies in the column space #' of \code{R}. #' #' @return A \code{"susie"} fit (or, with \code{init_only = TRUE}, the #' constructed data and params objects). 
#'
#' @export
susie_rss_lambda <- function(z = NULL, R = NULL, n = NULL, X = NULL,
                             L = min(10, if (!is.null(R)) ncol(R) else ncol(X)),
                             lambda, maf = NULL, maf_thresh = 0,
                             prior_variance = 50, residual_variance = NULL,
                             prior_weights = NULL, null_weight = 0,
                             intercept_value = 0,
                             estimate_residual_variance = FALSE,
                             estimate_residual_method = "MLE",
                             estimate_prior_variance = TRUE,
                             estimate_prior_method = c("optim", "EM", "simple"),
                             prior_variance_grid = NULL,
                             mixture_weights = NULL,
                             check_null_threshold = 0, prior_tol = 1e-9,
                             residual_variance_lowerbound = 0,
                             model_init = NULL, coverage = 0.95,
                             min_abs_corr = 0.5, max_iter = 100,
                             L_greedy = NULL, greedy_lbf_cutoff = 0.1,
                             tol = 1e-4,
                             convergence_method = c("elbo", "pip"),
                             verbose = FALSE, track_fit = FALSE,
                             check_prior = TRUE, check_R = TRUE,
                             check_z = FALSE, n_purity = 100, r_tol = 1e-8,
                             refine = FALSE, init_only = FALSE,
                             slot_prior = NULL) {

  # Input validation: lambda is mandatory, exactly one of R/X must be
  # given, and this path accepts single matrices only (no multi-panel
  # lists, unlike susie_rss).
  if (missing(lambda))
    stop("susie_rss_lambda() requires lambda.")
  if (is.null(R) && is.null(X))
    stop("Please provide either R (correlation matrix) or X (factor matrix).")
  if (!is.null(R) && !is.null(X))
    stop("Please provide either R or X, but not both.")
  if (is.list(R) && !is.matrix(R))
    stop("susie_rss_lambda() accepts only a single R matrix.")
  if (is.list(X) && !is.matrix(X))
    stop("susie_rss_lambda() accepts only a single X matrix.")
  # The RSS-lambda likelihood only supports the MLE variance-component
  # estimator; reject anything else up front.
  if (!identical(estimate_residual_method, "MLE"))
    stop("susie_rss_lambda() supports estimate_residual_method = \"MLE\" only.")
  convergence_method <- match.arg(convergence_method)

  # Reconcile the scalar-prior and mixture-prior settings; the resolved
  # values overwrite the four inputs below.
  mp <- resolve_mixture_prior(estimate_prior_method, estimate_prior_variance,
                              prior_variance_grid, mixture_weights)
  estimate_prior_method <- mp$estimate_prior_method
  estimate_prior_variance <- mp$estimate_prior_variance
  prior_variance_grid <- mp$prior_variance_grid
  mixture_weights <- mp$mixture_weights

  # Construct the data and params objects for the RSS-lambda likelihood.
  susie_objects <- rss_lambda_constructor(
    z = z, R = R, X = X, n = n, L = L, lambda = lambda, maf = maf,
    maf_thresh = maf_thresh, prior_variance = prior_variance,
    residual_variance = residual_variance, prior_weights = prior_weights,
    null_weight = null_weight, intercept_value = intercept_value,
    estimate_residual_variance = estimate_residual_variance,
    estimate_residual_method = estimate_residual_method,
    estimate_prior_variance = estimate_prior_variance,
    estimate_prior_method = estimate_prior_method,
    prior_variance_grid = prior_variance_grid,
    mixture_weights = mixture_weights,
    check_null_threshold = check_null_threshold, prior_tol = prior_tol,
    residual_variance_lowerbound = residual_variance_lowerbound,
    model_init = model_init, coverage = coverage,
    min_abs_corr = min_abs_corr, max_iter = max_iter, tol = tol,
    convergence_method = convergence_method, verbose = verbose,
    track_fit = track_fit, check_prior = check_prior, check_R = check_R,
    check_z = check_z, n_purity = n_purity, r_tol = r_tol,
    refine = refine, slot_prior = slot_prior, L_greedy = L_greedy,
    greedy_lbf_cutoff = greedy_lbf_cutoff
  )

  # Return the constructed objects without fitting when requested
  # (for callers that implement their own outer loop).
  if (init_only)
    return(susie_objects)
  susie_workhorse(susie_objects$data, susie_objects$params)
}

================================================
FILE: R/susieR-package.R
================================================

#' @keywords internal
"_PACKAGE"

# The following block is used by usethis to automatically manage
# roxygen namespace tags. Modify with care!
## usethis namespace: start
## usethis namespace: end
NULL

================================================
FILE: R/susie_auto.R
================================================

#' @title Attempt at Automating SuSiE for Hard Problems
#'
#' @description \code{susie_auto} is an attempt to automate reliable
#' running of susie even on hard problems. It implements a three-stage
#' strategy for each L: first, fit susie with very small residual
#' error; next, estimate residual error; finally, estimate the prior
#' variance. If the last step estimates some prior variances to be
#' zero, stop. Otherwise, double L, and repeat.
Initial runs are
#' performed with relaxed tolerance; the final run is performed using
#' the default susie tolerance.
#'
#' @param X An n by p matrix of covariates.
#'
#' @param y The observed responses, a vector of length n.
#'
#' @param L_init The initial value of L.
#'
#' @param L_max The largest value of L to consider.
#'
#' @param verbose If \code{verbose = TRUE}, the algorithm's progress,
#' and a summary of the optimization settings, are printed to the
#' console.
#'
#' @param init_tol The tolerance passed to \code{susie} during
#' early runs (set large to shorten the initial runs).
#'
#' @param standardize If \code{standardize = TRUE}, standardize the
#' columns of X to unit variance prior to fitting. Note that
#' \code{scaled_prior_variance} specifies the prior on the
#' coefficients of X \emph{after} standardization (if it is
#' performed). If you do not standardize, you may need to think more
#' carefully about specifying \code{scaled_prior_variance}. Whatever
#' your choice, the coefficients returned by \code{coef} are given for
#' \code{X} on the original input scale. Any column of \code{X} that
#' has zero variance is not standardized.
#'
#' @param intercept If \code{intercept = TRUE}, the intercept is
#' fitted; if \code{intercept = FALSE}, the intercept is set to
#' zero. Setting \code{intercept = FALSE} is generally not
#' recommended.
#'
#' @param max_iter Maximum number of IBSS iterations to perform.
#'
#' @param tol A small, non-negative number specifying the convergence
#' tolerance for the IBSS fitting procedure. The fitting procedure
#' will halt when the difference in the variational lower bound, or
#' \dQuote{ELBO} (the objective function to be maximized), is
#' less than \code{tol}.
#'
#' @param \dots Additional arguments passed to \code{\link{susie}}.
#'
#' @return See \code{\link{susie}} for a description of return values.
#'
#' @seealso \code{\link{susie}}
#'
#' @examples
#' set.seed(1)
#' n = 1000
#' p = 1000
#' beta = rep(0,p)
#' beta[1:4] = 1
#' X = matrix(rnorm(n*p),nrow = n,ncol = p)
#' X = scale(X,center = TRUE,scale = TRUE)
#' y = drop(X %*% beta + rnorm(n))
#' res = susie_auto(X,y)
#' plot(beta,coef(res)[-1])
#' abline(a = 0,b = 1,col = "skyblue",lty = "dashed")
#' plot(y,predict(res))
#' abline(a = 0,b = 1,col = "skyblue",lty = "dashed")
#'
#' @importFrom stats sd
#'
#' @export
#'
susie_auto = function (X, y, L_init = 1, L_max = 512, verbose = FALSE,
                       init_tol = 1, standardize = TRUE, intercept = TRUE,
                       max_iter = 100, tol = 1e-2, ...) {

  # Small residual variance used to force effects into the model during
  # the first stage of each round; y is never modified below, so this is
  # a loop invariant.
  small_sigma2 = 0.01*sd(y)^2

  # Stages 2 and 3 of a round: starting from the stage-1 fit, re-fit
  # with the residual variance estimated, then re-fit again with the
  # prior variances also estimated.
  refine_fit = function (fit) {
    fit = susie(X,y,L = nrow(fit$alpha),model_init = fit,tol = init_tol,
                estimate_residual_variance = TRUE,
                estimate_prior_variance = FALSE,
                standardize = standardize,intercept = intercept,
                max_iter = max_iter,...)
    susie(X,y,L = nrow(fit$alpha),model_init = fit,tol = init_tol,
          estimate_residual_variance = TRUE,
          estimate_prior_variance = TRUE,
          standardize = standardize,intercept = intercept,
          max_iter = max_iter,...)
  }

  L = L_init
  if (verbose)
    message(paste0("Trying L=",L))

  # First round, stage 1: fit with a very small fixed residual variance
  # so that effects are not shrunk away prematurely.
  fit = susie(X,y,L = L,residual_variance = small_sigma2,tol = init_tol,
              scaled_prior_variance = 1,estimate_residual_variance = FALSE,
              estimate_prior_variance = FALSE,standardize = standardize,
              intercept = intercept,max_iter = max_iter,...)
  fit = refine_fit(fit)

  # We call it converged---i.e., L is "big enough"---when at least one
  # prior variance is estimated to be zero; otherwise double L and
  # repeat the three stages, up to L_max.
  repeat {
    if (!all(fit$V > 0) || L > L_max)
      break
    for (i in 1:L) {
      fit = add_null_effect(fit,1) # Add in L more effects.
      fit$sigma2 = small_sigma2    # Reset residual variance to be small
                                   # again for the next round's stage 1.
    }
    L = 2*L
    if (verbose)
      message(paste0("Trying L=",L))
    fit = susie(X,y,L = nrow(fit$alpha),model_init = fit,tol = init_tol,
                estimate_residual_variance = FALSE,
                estimate_prior_variance = FALSE,
                standardize = standardize,intercept = intercept,
                max_iter = max_iter,...)
    fit = refine_fit(fit)
  }

  # Final run at the default tolerance to improve the fit.
  fit = susie(X,y,L = nrow(fit$alpha),model_init = fit,
              estimate_residual_variance = TRUE,
              estimate_prior_variance = TRUE,tol = tol,
              standardize = standardize,intercept = intercept,
              max_iter = max_iter,...)
  return(fit)
}

================================================
FILE: R/susie_constructors.R
================================================

# =============================================================================
# INDIVIDUAL-LEVEL DATA CONSTRUCTOR
#
# Constructs data and params objects for SuSiE from individual-level data (X, y).
# Handles data preprocessing, parameter validation, and object creation.
# =============================================================================
#'
#' @return A list containing:
#' \item{data}{A processed list containing X and y matrices with appropriate scaling
#' attributes and sample dimensions}
#' \item{params}{Validated params object with all input algorithm parameters}
#'
#' @keywords internal
#' @importFrom stats var
#' @noRd
individual_data_constructor <- function(X, y, L = min(10, ncol(X)),
                                        scaled_prior_variance = 0.2,
                                        residual_variance = NULL,
                                        prior_weights = NULL, null_weight = 0,
                                        standardize = TRUE, intercept = TRUE,
                                        estimate_residual_variance = TRUE,
                                        estimate_residual_method = "MoM",
                                        estimate_prior_variance = TRUE,
                                        estimate_prior_method = "optim",
                                        prior_variance_grid = NULL,
                                        mixture_weights = NULL,
                                        unmappable_effects = "none",
                                        check_null_threshold = 0,
                                        prior_tol = 1e-9,
                                        residual_variance_upperbound = Inf,
                                        model_init = NULL, s_init = NULL,
                                        coverage = 0.95, min_abs_corr = 0.5,
                                        compute_univariate_zscore = FALSE,
                                        na.rm = FALSE, max_iter = 100,
                                        tol = 1e-3,
                                        convergence_method = "elbo",
                                        verbose = FALSE, track_fit = FALSE,
                                        residual_variance_lowerbound = NULL,
                                        refine = FALSE, n_purity = 100,
                                        alpha0 = 0, beta0 = 0,
                                        slot_prior = NULL, L_greedy = NULL,
                                        greedy_lbf_cutoff = 0.1) {

  # Handle deprecated s_init argument: it is an alias for model_init and
  # supplying both is ambiguous.
  if (!is.null(s_init)) {
    if (!is.null(model_init))
      stop("Cannot specify both 's_init' and 'model_init'.")
    warning_message("s_init is deprecated and will be removed in a future ",
                    "version of susieR. Please use model_init instead.")
    model_init <- s_init
  }

  # Validate input X: dense double matrix, sparse matrix, or trend
  # filtering matrix (identified by the "matrix.type" attribute).
  if (!(is.double(X) & is.matrix(X)) & !inherits(X, "sparseMatrix") &
      is.null(attr(X, "matrix.type"))) {
    stop("Input X must be a double-precision matrix, or a sparse matrix, or ",
         "a trend filtering matrix.")
  }
  if (anyNA(X)) {
    stop("X contains NA values.")
  }

  # Constant column check for regular (non trend-filtering) matrix;
  # constant columns only trigger a warning, not an error.
  if (is.null(attr(X, "matrix.type")) || attr(X, "matrix.type") != "tfmatrix") {
    col_vars <- apply(X, 2, var)
    const_cols <- which(col_vars == 0 | is.na(col_vars))
    if (length(const_cols) > 0) {
      warning_message(sprintf("X contains %d constant columns (first few cols: %s).",
                              length(const_cols),
                              paste(head(const_cols, 10), collapse = ", ")))
    }
  }

  # Handle missing values in y: drop the corresponding rows of X and y
  # when na.rm = TRUE, otherwise error.
  if (anyNA(y)) {
    if (na.rm) {
      samples_kept <- which(!is.na(y))
      y <- y[samples_kept]
      X <- X[samples_kept, , drop = FALSE]
    } else {
      stop("Input y must not contain missing values.")
    }
  }

  # Default lower bound on the residual variance: a small fraction of
  # the sample variance of y. Computed after NA removal.
  if (is.null(residual_variance_lowerbound)) {
    residual_variance_lowerbound <- var(drop(y)) / 1e4
  }
  mean_y <- mean(y)

  # Force required preprocessing for unmappable effects methods: these
  # methods require centered and scaled data, so override the user's
  # settings (with a warning) rather than silently misbehaving.
  if (unmappable_effects != "none") {
    if (!intercept) {
      warning_message("Unmappable effects methods require centered data. Setting intercept=TRUE.")
      intercept <- TRUE
    }
    if (!standardize) {
      warning_message("Unmappable effects methods require scaled data. Setting standardize=TRUE.")
      standardize <- TRUE
    }
  }

  # Check for incompatible parameter combination.
  if (unmappable_effects != "none" && estimate_residual_method == "NIG") {
    stop("The combination of unmappable_effects = '", unmappable_effects,
         "' with estimate_residual_method = 'NIG' is not supported. ",
         "Please use estimate_residual_method = 'MoM' or 'MLE' instead.")
  }

  # Check for incompatible parameter combination.
  if (unmappable_effects %in% c("ash", "ash_filter_archived") &&
      estimate_prior_method == "EM") {
    stop("The combination of unmappable_effects = 'ash' with ",
         "estimate_prior_method = 'EM' is not supported. ",
         "Please use estimate_prior_method = 'optim' instead.")
  }

  # Handle null weights: a null weight of 0 means "no null column";
  # otherwise rescale the prior weights and append a dedicated
  # zero-valued column to X for the null variable.
  if (is.numeric(null_weight) && null_weight == 0) {
    null_weight <- NULL
  }
  if (!is.null(null_weight)) {
    if (!is.numeric(null_weight)) {
      stop("Null weight must be numeric.")
    }
    if (null_weight < 0 || null_weight >= 1) {
      stop("Null weight must be between 0 and 1.")
    }
    if (is.null(prior_weights)) {
      prior_weights <- c(rep(1 / ncol(X) * (1 - null_weight), ncol(X)),
                         null_weight)
    } else {
      prior_weights <- c(prior_weights * (1 - null_weight), null_weight)
    }
    # add the extra 0 column to X
    X <- cbind(X, 0)
  }

  # Store dimensions (after any null column has been appended).
  n <- nrow(X)
  p <- ncol(X)

  # Set uniform prior weights if not provided.
  if (is.null(prior_weights)) {
    prior_weights <- rep(1 / p, p)
  }

  # Validate and normalize prior_weights so they sum to 1.
  if (length(prior_weights) != p) {
    stop("Prior weights must have length p.")
  }
  if (all(prior_weights == 0)) {
    stop("Prior weight should be greater than 0 for at least one variable.")
  }
  prior_weights <- prior_weights / sum(prior_weights)

  # nocov start
  if (p > 1000 & !requireNamespace("Rfast", quietly = TRUE)) {
    warning_message("For an X with many columns, please consider installing ",
                    "the Rfast package for more efficient credible set (CS) ",
                    "calculations.", style = "hint")
  }
  # nocov end

  # Center y if intercept is included; mean_y was saved above so the
  # intercept can be recovered later.
  if (intercept) {
    y <- y - mean_y
  }

  # Compute and set X matrix attributes (column centers, scales, and
  # the "d" vector used by downstream updates).
  out <- compute_colstats(X, center = intercept, scale = standardize)
  attr(X, "scaled:center") <- out$cm
  attr(X, "scaled:scale") <- out$csd
  attr(X, "d") <- out$d

  # Create params object with all input parameters.
  params_object <- list(
    L = L,
    scaled_prior_variance = scaled_prior_variance,
    residual_variance = residual_variance,
    prior_weights = prior_weights,
    null_weight = null_weight,
    estimate_residual_variance = estimate_residual_variance,
    estimate_residual_method = estimate_residual_method,
    estimate_prior_variance = estimate_prior_variance,
    estimate_prior_method = estimate_prior_method,
    prior_variance_grid = prior_variance_grid,
    mixture_weights = mixture_weights,
    unmappable_effects = unmappable_effects,
    check_null_threshold = check_null_threshold,
    prior_tol = prior_tol,
    residual_variance_upperbound = residual_variance_upperbound,
    model_init = model_init,
    coverage = coverage,
    min_abs_corr = min_abs_corr,
    compute_univariate_zscore = compute_univariate_zscore,
    max_iter = max_iter,
    tol = tol,
    convergence_method = convergence_method,
    verbose = verbose,
    track_fit = track_fit,
    residual_variance_lowerbound = residual_variance_lowerbound,
    refine = refine,
    n_purity = n_purity,
    alpha0 = alpha0,
    beta0 = beta0,
    n = n,
    use_NIG = FALSE, # Will be set by validation function
    intercept = intercept,
    standardize = standardize,
    slot_prior = slot_prior,
    L_greedy = L_greedy,
    greedy_lbf_cutoff = greedy_lbf_cutoff
  )

  # Validate and apply parameter overrides.
  params_object <- validate_and_override_params(params_object)

  data_object <- structure(
    list(
      X = X,
      y = y,
      mean_y = mean_y,
      n = n,
      p = p
    ),
    class = "individual"
  )

  # Configure data object based on params.
  data_object <- configure_data(data_object, params_object)

  return(list(data = data_object, params = params_object))
}

# =============================================================================
# SUFFICIENT STATISTICS DATA CONSTRUCTOR
#
# Constructs data and params objects for SuSiE from sufficient statistics (XtX, Xty, yty).
# Handles data preprocessing, parameter validation, and object creation.
# =============================================================================
#'
#' Build the (data, params) pair used by the SuSiE workhorse from sufficient
#' statistics. Accepts either a full XtX matrix or a low-rank X (with Xty,
#' yty, n), validates inputs, optionally MAF-filters and standardizes, and
#' appends a "null" column when null_weight is set.
#'
#' @return A list containing:
#' \item{data}{A processed list containing XtX, Xty, yty matrices with appropriate scaling
#'   attributes and sample dimensions}
#' \item{params}{Validated params object with all input algorithm parameters}
#'
#' @keywords internal
#' @noRd
sufficient_stats_constructor <- function(Xty, yty, n, XtX = NULL, X = NULL,
                                         L = min(10, if (!is.null(XtX)) ncol(XtX) else ncol(X)),
                                         X_colmeans = NA, y_mean = NA,
                                         maf = NULL, maf_thresh = 0,
                                         check_input = FALSE, r_tol = 1e-8,
                                         standardize = TRUE,
                                         scaled_prior_variance = 0.2,
                                         residual_variance = NULL,
                                         prior_weights = NULL, null_weight = 0,
                                         model_init = NULL, s_init = NULL,
                                         estimate_residual_variance = TRUE,
                                         estimate_residual_method = "MoM",
                                         residual_variance_lowerbound = 0,
                                         residual_variance_upperbound = Inf,
                                         estimate_prior_variance = TRUE,
                                         estimate_prior_method = "optim",
                                         prior_variance_grid = NULL,
                                         mixture_weights = NULL,
                                         unmappable_effects = "none",
                                         check_null_threshold = 0,
                                         prior_tol = 1e-9,
                                         max_iter = 100, tol = 1e-3,
                                         convergence_method = "elbo",
                                         coverage = 0.95, min_abs_corr = 0.5,
                                         n_purity = 100, verbose = FALSE,
                                         track_fit = FALSE, check_prior = FALSE,
                                         refine = FALSE,
                                         alpha0 = 0.1, beta0 = 0.1,
                                         slot_prior = NULL, L_greedy = NULL,
                                         greedy_lbf_cutoff = 0.1) {
  # Handle deprecated s_init argument: copied into model_init after warning.
  if (!is.null(s_init)) {
    if (!is.null(model_init))
      stop("Cannot specify both 's_init' and 'model_init'.")
    warning_message("s_init is deprecated and will be removed ",
                    "version of susieR. Please use model_init instead.")
    model_init <- s_init
  }
  # Validate required inputs
  if (missing(n)) {
    stop("n must be provided.")
  }
  if (n <= 1) {
    stop("n must be greater than 1.")
  }
  if (is.null(X)) {
    # XtX path: validate XtX
    if (is.null(XtX) || missing(Xty) || missing(yty)) {
      stop("XtX, Xty, yty must all be provided.")
    }
    if (!(is.double(XtX) && is.matrix(XtX)) && !inherits(XtX, "sparseMatrix")) {
      stop("XtX must be a numeric dense or sparse matrix.")
    }
    if (ncol(XtX) != length(Xty)) {
      stop(paste0(
        "The dimension of XtX (", nrow(XtX), " by ", ncol(XtX),
        ") does not agree with expected (", length(Xty), " by ",
        length(Xty), ")."
      ))
    }
    # nocov start
    if (ncol(XtX) > 1000 & !requireNamespace("Rfast", quietly = TRUE)) {
      warning_message("For large R or large XtX, consider installing the ",
                      "Rfast package for better performance.", style = "hint")
    }
    # nocov end
    # Ensure XtX is symmetric; asymmetry (e.g. from numerical noise) is
    # repaired by averaging with the transpose.
    if (!is_symmetric_matrix(XtX)) {
      warning_message("XtX not symmetric; using (XtX + t(XtX))/2.")
      XtX <- (XtX + t(XtX)) / 2
    }
    # Apply MAF filter if provided: keep only variables with maf > maf_thresh.
    if (!is.null(maf)) {
      if (length(maf) != length(Xty)) {
        stop(paste("The length of maf does not agree with expected",
                   length(Xty), "."))
      }
      id <- which(maf > maf_thresh)
      XtX <- XtX[id, id]
      Xty <- Xty[id]
    }
    # Additional validation
    if (anyNA(XtX)) {
      stop("Input XtX matrix contains NAs.")
    }
    # Positive-semidefinite check (opt-in; check_semi_pd is a project helper).
    if (check_input) {
      semi_pd <- check_semi_pd(XtX, r_tol)
      if (!semi_pd$status) {
        stop("XtX is not a positive semidefinite matrix.")
      }
      # Check whether Xty lies in space spanned by non-zero eigenvectors of XtX
      proj <- check_projection(semi_pd$matrix, Xty)
      if (!proj$status) {
        warning_message("Xty does not lie in the space of the non-zero eigenvectors ",
                        "of XtX.")
      }
    }
  } else {
    # X low-rank path: validate X. NOTE: maf filtering above is applied only
    # on the XtX path; the X path here is not filtered.
    if (ncol(X) != length(Xty)) {
      stop(paste0(
        "The number of columns of X (", ncol(X),
        ") does not agree with the length of Xty (", length(Xty), ")."
      ))
    }
  }
  # Common validation for Xty
  if (any(is.infinite(Xty))) {
    stop("Input Xty contains infinite values.")
  }
  if (anyNA(Xty)) {
    warning_message("NA values in Xty are replaced with 0.")
    Xty[is.na(Xty)] <- 0
  }
  # Define p before null_weight handling
  p <- if (!is.null(XtX)) ncol(XtX) else ncol(X)
  # Handle null weights: null_weight = 0 is treated the same as NULL.
  if (is.numeric(null_weight) && null_weight == 0) {
    null_weight <- NULL
  }
  if (!is.null(null_weight)) {
    if (!is.numeric(null_weight)) {
      stop("Null weight must be numeric.")
    }
    if (null_weight < 0 || null_weight >= 1) {
      stop("Null weight must be between 0 and 1.")
    }
    # Rescale existing weights by (1 - null_weight) and append the null slot.
    if (is.null(prior_weights)) {
      prior_weights <- c(rep(1 / p * (1 - null_weight), p), null_weight)
    } else {
      prior_weights <- c(prior_weights * (1 - null_weight), null_weight)
    }
    # Append an all-zero row/column (XtX) or column (X) for the null variable.
    if (!is.null(XtX)) {
      XtX <- cbind(rbind(XtX, 0), 0)
    }
    if (!is.null(X)) {
      X <- cbind(X, 0)
    }
    Xty <- c(Xty, 0)
    if (length(X_colmeans) == 1) {
      X_colmeans <- rep(X_colmeans, p)
    }
    if (length(X_colmeans) != p) {
      stop("The length of X_colmeans does not agree with number of variables.")
    }
    # Add 0 for null column
    X_colmeans <- c(X_colmeans, 0)
    # Update p after adding null column
    p <- p + 1
  }
  # Set uniform prior weights if not provided
  if (is.null(prior_weights)) {
    prior_weights <- rep(1 / p, p)
  }
  # Validate and normalize prior_weights (normalized to sum to 1).
  if (length(prior_weights) != p) {
    stop("Prior weights must have length p.")
  }
  if (all(prior_weights == 0)) {
    stop("Prior weight should be greater than 0 for at least one variable.")
  }
  prior_weights <- prior_weights / sum(prior_weights)
  # Standardize if requested
  if (!is.null(X)) {
    # Low-rank X path: standardize columns of X. csd are the column SDs
    # implied by colSums(X^2)/(n-1); zero-SD columns get csd = 1 so the
    # division below is a no-op rather than producing NaN.
    if (standardize) {
      dXtX <- colSums(X^2)
      csd <- sqrt(dXtX / (n - 1))
      csd[csd == 0] <- 1
      X <- t(t(X) / csd)
      Xty <- Xty / csd
    } else {
      csd <- rep(1, length = p)
    }
    attr(X, "d") <- colSums(X^2)
    attr(X, "scaled:scale") <- csd
    colnames(X) <- names(Xty)
  } else {
    # XtX path: standardize XtX by scaling both rows and columns by 1/csd,
    # where csd is implied by diag(XtX)/(n-1); Xty is scaled to match.
    if (standardize) {
      dXtX <- diag(XtX)
      csd <- sqrt(dXtX / (n - 1))
      csd[csd == 0] <- 1
      XtX <- t((1 / csd) * XtX) / csd
      Xty <- Xty / csd
    } else {
      csd <- rep(1, length = p)
    }
    attr(XtX, "d") <- diag(XtX)
    attr(XtX, "scaled:scale") <- csd
  }
  # Recycle a scalar X_colmeans (typically NA) to length p, then check.
  if (length(X_colmeans) == 1) {
    X_colmeans <- rep(X_colmeans, p)
  }
  if (length(X_colmeans) != p) {
    stop(
      "`X_colmeans` length (", length(X_colmeans),
      ") does not match number of variables (", p, ")."
    )
  }
  # Create params object with all input parameters
  params_object <- list(
    L = L,
    scaled_prior_variance = scaled_prior_variance,
    residual_variance = residual_variance,
    prior_weights = prior_weights,
    null_weight = null_weight,
    estimate_residual_variance = estimate_residual_variance,
    estimate_residual_method = estimate_residual_method,
    estimate_prior_variance = estimate_prior_variance,
    estimate_prior_method = estimate_prior_method,
    prior_variance_grid = prior_variance_grid,
    mixture_weights = mixture_weights,
    unmappable_effects = unmappable_effects,
    check_null_threshold = check_null_threshold,
    prior_tol = prior_tol,
    residual_variance_upperbound = residual_variance_upperbound,
    model_init = model_init,
    coverage = coverage,
    min_abs_corr = min_abs_corr,
    compute_univariate_zscore = FALSE, # SS doesn't support univariate zscore
    max_iter = max_iter,
    tol = tol,
    convergence_method = convergence_method,
    verbose = verbose,
    track_fit = track_fit,
    residual_variance_lowerbound = residual_variance_lowerbound,
    refine = refine,
    n_purity = n_purity,
    alpha0 = alpha0,
    beta0 = beta0,
    n = n,
    use_NIG = FALSE,
    intercept = FALSE, # SS always uses intercept = FALSE
    standardize = standardize,
    check_prior = check_prior,
    slot_prior = slot_prior,
    L_greedy = L_greedy,
    greedy_lbf_cutoff = greedy_lbf_cutoff
  )
  # Validate and apply parameter overrides
  params_object <- validate_and_override_params(params_object)
  # Assemble data object
  data_object <- structure(
    list(
      XtX = XtX,
      X = X,
      Xty = Xty,
      yty = yty,
      n = n,
      p = p,
      X_colmeans = X_colmeans,
      y_mean = y_mean
    ),
    class = "ss"
  )
  # Configure data object based on params
  data_object <- configure_data(data_object, params_object)
  return(list(data = data_object, params = params_object))
}

# =============================================================================
# SUMMARY STATISTICS (RSS) DATA CONSTRUCTOR
#
# Constructs data and params objects for SuSiE from summary statistics
# (z-scores, R matrix, or multi-panel R/X reference).
# =============================================================================
#'
#' Entry point for the RSS-style inputs. Dispatches to
#' ss_mixture_constructor() when R or X is a list (multi-panel), to
#' rss_lambda_constructor() when lambda != 0, and otherwise converts the
#' summary statistics to sufficient statistics and delegates to
#' sufficient_stats_constructor().
#'
#' @return A list containing:
#' \item{data}{A processed list containing converted matrices with appropriate scaling
#'   attributes and sample dimensions}
#' \item{params}{Validated params object with all input algorithm parameters}
#'
#' @keywords internal
#' @noRd
summary_stats_constructor <- function(z = NULL, R = NULL, X = NULL, n = NULL,
                                      bhat = NULL, shat = NULL, var_y = NULL,
                                      L = min(10, if (!is.null(R)) ncol(R) else ncol(X)),
                                      lambda = 0,
                                      maf = NULL, maf_thresh = 0,
                                      prior_variance = 50,
                                      scaled_prior_variance = 0.2,
                                      residual_variance = NULL,
                                      prior_weights = NULL, null_weight = 0,
                                      standardize = TRUE, intercept_value = 0,
                                      estimate_residual_variance = FALSE,
                                      estimate_residual_method = "MoM",
                                      estimate_prior_variance = TRUE,
                                      estimate_prior_method = "optim",
                                      prior_variance_grid = NULL,
                                      mixture_weights = NULL,
                                      unmappable_effects = "none",
                                      check_null_threshold = 0,
                                      prior_tol = 1e-9,
                                      residual_variance_lowerbound = 0,
                                      residual_variance_upperbound = Inf,
                                      model_init = NULL, s_init = NULL,
                                      coverage = 0.95, min_abs_corr = 0.5,
                                      max_iter = 100, tol = 1e-3,
                                      convergence_method = "elbo",
                                      verbose = FALSE, track_fit = FALSE,
                                      check_input = FALSE, check_prior = TRUE,
                                      n_purity = 100, r_tol = 1e-8,
                                      refine = FALSE,
                                      R_finite = NULL, R_mismatch = "none",
                                      eig_delta_rel = 1e-3, eig_delta_abs = 0,
                                      artifact_threshold = 0.1,
                                      alpha0 = 0.1, beta0 = 0.1,
                                      slot_prior = NULL, L_greedy = NULL,
                                      greedy_lbf_cutoff = 0.1) {
  # Handle deprecated s_init argument: copied into model_init after warning.
  if (!is.null(s_init)) {
    if (!is.null(model_init))
      stop("Cannot specify both 's_init' and 'model_init'.")
    warning_message("s_init is deprecated and will be removed in a future ",
                    "version of susieR. Please use model_init instead.")
    model_init <- s_init
  }
  # NIG prior requires an explicit sample size n: the default alpha0/beta0
  # scale as 1/sqrt(n) and the NIG marginal likelihood depends on n. Without
  # n, summary_stats_constructor bumps n to 2 internally (see below), which
  # would silently corrupt the NIG posterior. Reject early with a clear error.
  if (estimate_residual_method == "NIG" &&
      (is.null(n) || !is.numeric(n) || length(n) != 1 ||
       !is.finite(n) || n < 1)) {
    stop("estimate_residual_method = \"NIG\" requires a valid sample ",
         "size `n` (got n = ", paste(n, collapse = ""), "). ",
         "For susie_rss(), pass `n` explicitly.")
  }
  # PVE-adjusted z-scores: shrink large z toward zero to account for
  # winner's curse. Applied to ALL paths when sample size is available.
  # Guard: z may be NULL when bhat/shat are provided (converted later).
  # pve_adjusted records whether the shrinkage has been applied, so it is
  # not applied twice after a bhat/shat -> z conversion.
  pve_adjusted <- FALSE
  if (!is.null(z) && !is.null(n) && n > 1) {
    adj <- (n - 1) / (z^2 + n - 2)
    z <- sqrt(adj) * z
    pve_adjusted <- TRUE
  }
  # Multi-panel mode is signalled by passing a list (not a matrix) for X or R.
  is_multipanel <- (is.list(X) && !is.matrix(X)) || (is.list(R) && !is.matrix(R))
  R_mismatch <- match.arg(R_mismatch, c("none", "map", "map_qc"))
  if (isTRUE(R_finite) && is.null(X))
    stop("R_finite = TRUE requires X input. When using precomputed R, ",
         "provide the reference sample size explicitly.")
  # resolve_R_finite is a project helper; it normalizes the R_finite input
  # given whichever of X/R was supplied.
  R_finite <- resolve_R_finite(R_finite, if (!is.null(X)) X else R, is_multipanel)
  # --- Dispatch 1: multi-panel mixture path -------------------------------
  if (is_multipanel) {
    if (lambda != 0)
      stop("Multi-panel mixture is available only on the sufficient-statistics path.")
    if (!is.null(bhat) || !is.null(shat)) {
      stop("Parameters 'bhat' and 'shat' are not supported in the ",
           "multi-panel summary-statistics path. ",
           "Please provide z-scores directly.")
    }
    if (!is.null(var_y))
      stop("Parameter 'var_y' is not supported in the multi-panel path.")
    return(ss_mixture_constructor(
      z = z, R = R, X = X, n = n, L = L,
      maf = maf, maf_thresh = maf_thresh,
      scaled_prior_variance = scaled_prior_variance,
      residual_variance = residual_variance,
      prior_weights = prior_weights, null_weight = null_weight,
      standardize = standardize,
      estimate_residual_variance = estimate_residual_variance,
      estimate_residual_method = estimate_residual_method,
      estimate_prior_variance = estimate_prior_variance,
      estimate_prior_method = estimate_prior_method,
      prior_variance_grid = prior_variance_grid,
      mixture_weights = mixture_weights,
      unmappable_effects = unmappable_effects,
      check_null_threshold = check_null_threshold,
      prior_tol = prior_tol,
      residual_variance_lowerbound = residual_variance_lowerbound,
      residual_variance_upperbound = residual_variance_upperbound,
      model_init = model_init,
      coverage = coverage, min_abs_corr = min_abs_corr,
      max_iter = max_iter, tol = tol,
      convergence_method = convergence_method,
      verbose = verbose, track_fit = track_fit,
      check_input = check_input, check_prior = check_prior,
      n_purity = n_purity, r_tol = r_tol, refine = refine,
      R_finite = R_finite, R_mismatch = R_mismatch,
      eig_delta_rel = eig_delta_rel, eig_delta_abs = eig_delta_abs,
      artifact_threshold = artifact_threshold,
      alpha0 = alpha0, beta0 = beta0,
      slot_prior = slot_prior, L_greedy = L_greedy,
      greedy_lbf_cutoff = greedy_lbf_cutoff
    ))
  }
  # --- Dispatch 2: RSS-lambda (eigendecomposition) path -------------------
  if (lambda != 0) {
    if (!is.null(R_finite))
      stop("R_finite is not available in the RSS-lambda path.")
    if (R_mismatch != "none")
      stop("R_mismatch is not available in the RSS-lambda path.")
    if (!is.null(bhat) || !is.null(shat)) {
      stop("Parameters 'bhat' and 'shat' are not supported in the ",
           "RSS-lambda path.")
    }
    if (!is.null(var_y))
      stop("Parameter 'var_y' is not supported in the RSS-lambda path.")
    return(rss_lambda_constructor(
      z = z, R = R, X = X, n = n, L = L, lambda = lambda,
      maf = maf, maf_thresh = maf_thresh,
      prior_variance = prior_variance,
      residual_variance = residual_variance,
      prior_weights = prior_weights, null_weight = null_weight,
      intercept_value = intercept_value,
      estimate_residual_variance = estimate_residual_variance,
      estimate_residual_method = estimate_residual_method,
      estimate_prior_variance = estimate_prior_variance,
      estimate_prior_method = estimate_prior_method,
      prior_variance_grid = prior_variance_grid,
      mixture_weights = mixture_weights,
      check_null_threshold = check_null_threshold,
      prior_tol = prior_tol,
      residual_variance_lowerbound = residual_variance_lowerbound,
      model_init = model_init,
      coverage = coverage, min_abs_corr = min_abs_corr,
      max_iter = max_iter, tol = tol,
      convergence_method = convergence_method,
      verbose = verbose, track_fit = track_fit,
      check_prior = check_prior, check_R = TRUE, check_z = FALSE,
      n_purity = n_purity, r_tol = r_tol, refine = refine,
      slot_prior = slot_prior, L_greedy = L_greedy,
      greedy_lbf_cutoff = greedy_lbf_cutoff
    ))
  }
  # Parameter validation for standard RSS (lambda = 0)
  if (intercept_value != 0) {
    stop("Parameter 'intercept_value' is only supported in the ",
         "eigendecomposition path (lambda != 0 or multi-panel).")
  }
  # Issue warning for estimate_residual_variance if TRUE
  if (estimate_residual_variance && lambda == 0) {
    warning_message("For estimate_residual_variance = TRUE, please check ",
                    "that R is the \"in-sample\" R matrix; that is, the ",
                    "correlation matrix obtained using the exact same data ",
                    "matrix X that was used for the other summary ",
                    "statistics. Also note, when covariates are included in ",
                    "the univariate regressions that produced the summary ",
                    "statistics, also consider removing these effects from ",
                    "X before computing R.")
  }
  # For SuSiE-ash with summary statistics, recommend providing bhat/shat/var_y
  # for best agreement with individual-level analysis. The z+R-only path
  # operates on a standardized scale (var_y=1) and may give different results.
  if (unmappable_effects %in% c("ash", "ash_filter_archived") &&
      is.null(bhat) && is.null(var_y)) {
    warning_message("SuSiE-ash with z-scores and R only operates on a ",
                    "standardized scale. For best agreement with ",
                    "individual-level analysis, provide bhat, shat, and ",
                    "var_y instead of z-scores.")
  }
  # Determine p from z or bhat
  if (is.null(z) && !is.null(bhat)) {
    p <- length(bhat)
  } else if (!is.null(z)) {
    p <- length(z)
  } else {
    stop("Please provide either z or (bhat, shat).")
  }
  # Check dimensions of R or X
  if (!is.null(R)) {
    if (nrow(R) != p) {
      stop(paste0(
        "The dimension of R (", nrow(R), " x ", ncol(R), ") does not ",
        "agree with expected (", p, " x ", p, ")."
      ))
    }
  } else if (!is.null(X)) {
    if (ncol(X) != p) {
      stop(paste0(
        "The number of columns of X (", ncol(X), ") does not ",
        "agree with expected (", p, ")."
      ))
    }
  }
  # Check input n
  if (!is.null(n)) {
    if (n <= 1) {
      stop("n must be greater than 1.")
    }
  }
  # Check inputs z, bhat and shat: exactly one of z or (bhat, shat) allowed.
  if (sum(c(is.null(z), is.null(bhat) || is.null(shat))) != 1) {
    stop("Please provide either z or (bhat, shat), but not both.")
  }
  # Convert bhat/shat to z-scores when z was not given; a scalar shat is
  # recycled to the length of bhat.
  if (is.null(z)) {
    if (length(shat) == 1) {
      shat <- rep(shat, length(bhat))
    }
    if (length(bhat) != length(shat)) {
      stop("The lengths of bhat and shat do not agree.")
    }
    if (anyNA(bhat) || anyNA(shat)) {
      stop("bhat, shat cannot have missing values.")
    }
    if (any(shat <= 0)) {
      stop("shat cannot have zero or negative elements.")
    }
    z <- bhat / shat
  }
  if (length(z) < 1) {
    stop("Input vector z should have at least one element.")
  }
  z[is.na(z)] <- 0
  # Apply PVE adjustment if not already done (when z was computed from bhat/shat).
  # Note: `adj` assigned here (or in the earlier PVE block) is reused further
  # below when shat/var_y are supplied.
  if (!pve_adjusted && !is.null(n) && n > 1) {
    adj <- (n - 1) / (z^2 + n - 2)
    z <- sqrt(adj) * z
    pve_adjusted <- TRUE
  }
  # MAF filter (after z-scores are computed)
  if (!is.null(maf)) {
    if (length(maf) != length(z)) {
      stop(paste0("The length of maf does not agree with expected ", length(z)))
    }
    id <- which(maf > maf_thresh)
    if (!is.null(R)) R <- R[id, id]
    if (!is.null(X)) X <- X[, id, drop = FALSE]
    z <- z[id]
    # Update p after filtering
    p <- length(z)
  }
  # Standardize X so X'X = R (correlation matrix). The model assumes
  # column-standardized X; without this, X'X/B gives sample covariance
  # which != correlation when columns have different variances.
  if (!is.null(X)) {
    X <- standardize_X(X)
  }
  R_mismatch <- match.arg(R_mismatch, c("none", "map", "map_qc"))
  if (R_mismatch != "none" && is.null(R_finite))
    stop("R_mismatch requires R_finite because lambda_bias is estimated ",
         "as extra R bias beyond finite-reference uncertainty.")
  # R diagnostics (static, computed once at initialization).
  # X is standardized (X'X = R) at this point.
  R_finite_diagnostics <- NULL
  if (!is.null(R_finite)) {
    R_finite_diagnostics <- compute_R_finite_diagnostics(
      X = X, R = R, B = R_finite, p = length(z),
      x_is_standardized = TRUE)
  }
  # Cache eigen(R) for the Q_art QC diagnostic. Only computed when the
  # user opts into map_qc; the standard "map" path does not pay the
  # O(p^3) eigen cost. Works for both R-input and X-input: after
  # standardize_X, crossprod(X) == R. Reuses the attr(R, "eigen")
  # convention when the caller pre-computed it.
  eigen_R_cache <- NULL
  if (R_mismatch == "map_qc") {
    eigen_R_cache <- if (!is.null(R)) attr(R, "eigen") else NULL
    if (is.null(eigen_R_cache)) {
      R_for_eigen <- if (!is.null(R)) R else crossprod(X)
      eigen_R_cache <- eigen(R_for_eigen, symmetric = TRUE)
    }
  }
  # Convert to sufficient statistics format
  XtX <- NULL
  if (is.null(n)) {
    # Sample size not provided - use unadjusted z-scores. n is set to 2 below
    # so downstream (n - 1) factors become 1.
    warning_message("Providing the sample size (n), or even a rough estimate of n, ",
                    "is highly recommended. Without n, the implicit assumption is ",
                    "n is large (Inf) and the effect sizes are small (close to zero).")
    if (!is.null(R)) {
      XtX <- R
    }
    # X path: X'X = R already after standardize_X, no further scaling needed.
    Xty <- z
    yty <- 1
    n <- 2
    scaled_prior_variance <- prior_variance
  } else {
    # Sample size provided - use PVE-adjusted z-scores
    if (!is.null(shat) && !is.null(var_y)) {
      # var_y and shat provided - effects on original scale (R path only).
      # NOTE(review): z was already multiplied by sqrt(adj) in the PVE block
      # above, and Xty below multiplies by sqrt(adj) again — confirm the
      # intended scaling (Xty = adj * z_raw * var_y / shat) is correct.
      XtXdiag <- var_y * adj / (shat^2)
      XtX <- t(R * sqrt(XtXdiag)) * sqrt(XtXdiag)
      XtX <- (XtX + t(XtX)) / 2
      Xty <- z * sqrt(adj) * var_y / shat
      yty <- (n - 1) * var_y
    } else {
      # Effects on standardized X, y scale
      if (!is.null(R)) {
        XtX <- (n - 1) * R
      } else {
        # X path: X'X = R after standardize_X, scale to X'X = (n-1)*R
        X <- X * sqrt(n - 1)
      }
      Xty <- sqrt(n - 1) * z
      yty <- (n - 1) * (if (!is.null(var_y)) var_y else 1)
    }
  }
  # Use sufficient_stats_constructor with ALL parameters
  result <- sufficient_stats_constructor(
    Xty = Xty, yty = yty, n = n, XtX = XtX, X = X, L = L,
    X_colmeans = NA, y_mean = NA,
    maf = NULL, maf_thresh = 0,
    check_input = check_input, r_tol = r_tol,
    standardize = standardize,
    scaled_prior_variance = scaled_prior_variance,
    residual_variance = residual_variance,
    prior_weights = prior_weights, null_weight = null_weight,
    model_init = model_init,
    estimate_residual_variance = estimate_residual_variance,
    estimate_residual_method = estimate_residual_method,
    residual_variance_lowerbound = residual_variance_lowerbound,
    residual_variance_upperbound = residual_variance_upperbound,
    estimate_prior_variance = estimate_prior_variance,
    estimate_prior_method = estimate_prior_method,
    prior_variance_grid = prior_variance_grid,
    mixture_weights = mixture_weights,
    unmappable_effects = unmappable_effects,
    check_null_threshold = check_null_threshold,
    prior_tol = prior_tol,
    max_iter = max_iter, tol = tol,
    convergence_method = convergence_method,
    coverage = coverage, min_abs_corr = min_abs_corr,
    n_purity = n_purity,
    verbose = verbose, track_fit = track_fit,
    check_prior = check_prior, refine = refine,
    alpha0 = alpha0, beta0 = beta0,
    slot_prior = slot_prior, L_greedy = L_greedy,
    greedy_lbf_cutoff = greedy_lbf_cutoff
  )
  # Attach finite-reference R metadata to data object.
  if (!is.null(R_finite)) {
    result$data$R_finite_B <- R_finite
    result$data$R_finite_diagnostics <- R_finite_diagnostics
    result$data$R_mismatch <- R_mismatch
  }
  # eigen(R) cache for Q_art diagnostic (map_qc only).
  if (!is.null(eigen_R_cache))
    result$data$eigen_R <- eigen_R_cache
  # Attach R-bias / mismatch params consumed by R/rss_mismatch.R.
  result$params$R_mismatch <- R_mismatch
  result$params$eig_delta_rel <- eig_delta_rel
  result$params$eig_delta_abs <- eig_delta_abs
  result$params$artifact_threshold <- artifact_threshold
  return(result)
}

# =============================================================================
# SS MULTI-PANEL MIXTURE DATA CONSTRUCTOR
# =============================================================================
#'
#' Builds the (data, params) pair for the multi-panel mixture mode: z-scores
#' plus a list of K LD panels given either as correlation matrices (R) or
#' reference genotype matrices (X). Initializes panel weights (omega) as a
#' point mass on a single panel and assembles an "ss_mixture"/"ss" data
#' object for the workhorse.
#'
#' @keywords internal
#' @noRd
ss_mixture_constructor <- function(z, R = NULL, X = NULL, n,
                                   L = min(10, if (!is.null(R)) ncol(R[[1]]) else ncol(X[[1]])),
                                   maf = NULL, maf_thresh = 0,
                                   scaled_prior_variance = 0.2,
                                   residual_variance = NULL,
                                   prior_weights = NULL, null_weight = 0,
                                   standardize = TRUE,
                                   estimate_residual_variance = FALSE,
                                   estimate_residual_method = "MoM",
                                   estimate_prior_variance = TRUE,
                                   estimate_prior_method = "optim",
                                   prior_variance_grid = NULL,
                                   mixture_weights = NULL,
                                   unmappable_effects = "none",
                                   check_null_threshold = 0,
                                   prior_tol = 1e-9,
                                   residual_variance_lowerbound = 0,
                                   residual_variance_upperbound = Inf,
                                   model_init = NULL,
                                   coverage = 0.95, min_abs_corr = 0.5,
                                   max_iter = 100, tol = 1e-3,
                                   convergence_method = "pip",
                                   verbose = FALSE, track_fit = FALSE,
                                   check_input = FALSE, check_prior = TRUE,
                                   n_purity = 100, r_tol = 1e-8,
                                   refine = FALSE,
                                   R_finite = NULL, R_mismatch = "none",
                                   eig_delta_rel = 1e-3, eig_delta_abs = 0,
                                   artifact_threshold = 0.1,
                                   alpha0 = 0.1, beta0 = 0.1,
                                   slot_prior = NULL, L_greedy = NULL,
                                   greedy_lbf_cutoff = 0.1) {
  # Multi-panel mode requires a single scalar sample size and z-scores.
  if (is.null(n) || !is.numeric(n) || length(n) != 1 || n <= 1)
    stop("Sample size 'n' is required for multi-panel mode.")
  if (is.null(z))
    stop("Multi-panel mode requires z-scores.")
  if (!is.null(R) && !is.null(X))
    stop("Please provide either R or X, but not both.")
  use_R <- !is.null(R)
  panels <- if (use_R) R else X
  K <- length(panels)
  if (K < 1)
    stop("Multi-panel input must contain at least one panel.")
  p <- length(z)
  if (use_R) {
    # R path: each panel must be a numeric p x p matrix; asymmetric panels
    # are symmetrized in place.
    for (k in seq_len(K)) {
      if (!is.matrix(R[[k]]) || !is.numeric(R[[k]]))
        stop("Each element of R list must be a numeric matrix.")
      if (nrow(R[[k]]) != p || ncol(R[[k]]) != p)
        stop("Each element of R list must have dimension length(z) by length(z).")
      if (!is_symmetric_matrix(R[[k]]))
        R[[k]] <- (R[[k]] + t(R[[k]])) / 2
    }
    # safe_cov2cor is a project helper (presumably a guarded cov2cor —
    # see its definition elsewhere in the package).
    panel_R <- lapply(R, safe_cov2cor)
    X_list <- NULL
    B_list <- R_finite
    init_panel <- attr(R, ".init_panel")
    omega_cache <- NULL
  } else {
    # X path: standardize each reference panel so crossprod gives R.
    for (k in seq_len(K)) {
      if (!is.matrix(X[[k]]) || !is.numeric(X[[k]]))
        stop("Each element of X list must be a numeric matrix.")
      if (ncol(X[[k]]) != p)
        stop("Each element of X list must have length(z) columns.")
    }
    X_list <- lapply(X, standardize_X)
    panel_R <- lapply(X_list, function(Xk) cov2cor(crossprod(Xk)))
    B_list <- if (is.null(R_finite)) NULL else R_finite
    init_panel <- attr(X, ".init_panel")
    # Precompute the omega cache only in the low-rank regime (total
    # reference rows < p).
    omega_cache <- if (sum(vapply(X_list, nrow, integer(1))) < p)
      precompute_omega_cache(X_list, z)
    else NULL
  }
  # MAF filter applied consistently to z, all panels, and X_list.
  if (!is.null(maf)) {
    if (length(maf) != p)
      stop(paste0("The length of maf does not agree with expected ", p, "."))
    id <- which(maf > maf_thresh)
    z <- z[id]
    panel_R <- lapply(panel_R, function(Rk) Rk[id, id, drop = FALSE])
    if (!is.null(X_list))
      X_list <- lapply(X_list, function(Xk) Xk[, id, drop = FALSE])
    p <- length(z)
  }
  if (any(is.infinite(z)))
    stop("z contains infinite values.")
  if (anyNA(z)) {
    warning_message("NA values in z-scores are replaced with 0.")
    z[is.na(z)] <- 0
  }
  # Null-weight handling mirrors the other constructors: append a null
  # variable (zero column/row) to every panel and to z.
  if (is.numeric(null_weight) && null_weight == 0)
    null_weight <- NULL
  if (!is.null(null_weight)) {
    if (!is.numeric(null_weight))
      stop("Null weight must be numeric.")
    if (null_weight < 0 || null_weight >= 1)
      stop("Null weight must be between 0 and 1.")
    if (is.null(prior_weights)) {
      prior_weights <- c(rep(1 / p * (1 - null_weight), p), null_weight)
    } else {
      prior_weights <- c(prior_weights * (1 - null_weight), null_weight)
    }
    panel_R <- lapply(panel_R, function(Rk) cbind(rbind(Rk, 0), 0))
    if (!is.null(X_list))
      X_list <- lapply(X_list, function(Xk) cbind(Xk, 0))
    z <- c(z, 0)
    p <- p + 1L
  }
  if (is.null(prior_weights))
    prior_weights <- rep(1 / p, p)
  # Initialize panel weights omega as a point mass on the ".init_panel"
  # attribute if supplied, otherwise on the first panel; R_init is the
  # corresponding weighted panel combination, symmetrized.
  k_best <- if (!is.null(init_panel)) init_panel else 1L
  omega_init <- rep(0, K)
  omega_init[k_best] <- 1
  R_init <- Reduce("+", Map(function(w, Rk) w * Rk, omega_init, panel_R))
  R_init <- 0.5 * (R_init + t(R_init))
  R_finite_B <- NULL
  R_finite_diagnostics <- NULL
  if (!is.null(R_finite)) {
    # Effective reference size for the omega-weighted panel mixture.
    B_list <- as.numeric(R_finite)
    R_finite_B <- 1 / sum(omega_init^2 / B_list)
    R_finite_diagnostics <- compute_R_finite_diagnostics(
      R = R_init, B = R_finite_B, p = p)
  }
  nm1 <- n - 1
  XtX <- nm1 * R_init
  X_ss <- NULL
  if (!is.null(X_list)) {
    # Low-rank representation: meta-panel X scaled so crossprod(X_ss) plays
    # the role of (n-1) * R_init; XtX is dropped in favor of X_ss.
    X_ss <- form_X_meta(X_list, omega_init) * sqrt(nm1)
    attr(X_ss, "d") <- rep(nm1, p)
    attr(X_ss, "scaled:scale") <- rep(1, p)
    XtX <- NULL
  }
  params_object <- list(
    L = L,
    scaled_prior_variance = scaled_prior_variance,
    residual_variance = residual_variance,
    prior_weights = prior_weights,
    null_weight = null_weight,
    estimate_residual_variance = estimate_residual_variance,
    estimate_residual_method = estimate_residual_method,
    residual_variance_lowerbound = residual_variance_lowerbound,
    residual_variance_upperbound = residual_variance_upperbound,
    estimate_prior_variance = estimate_prior_variance,
    estimate_prior_method = estimate_prior_method,
    prior_variance_grid = prior_variance_grid,
    mixture_weights = mixture_weights,
    unmappable_effects = unmappable_effects,
    check_null_threshold = check_null_threshold,
    prior_tol = prior_tol,
    max_iter = max_iter, tol = tol,
    convergence_method = convergence_method,
    coverage = coverage, min_abs_corr = min_abs_corr,
    compute_univariate_zscore = FALSE,
    verbose = verbose, track_fit = track_fit,
    check_prior = check_prior, refine = refine,
    n_purity = n_purity,
    alpha0 = alpha0,
    beta0 = beta0,
    n = n,
    use_NIG = estimate_residual_method == "NIG",
    intercept = FALSE,
    standardize = standardize,
    model_init = model_init,
    slot_prior = slot_prior,
    L_greedy = L_greedy,
    greedy_lbf_cutoff = greedy_lbf_cutoff,
    R_mismatch = R_mismatch,
    eig_delta_rel = eig_delta_rel,
    eig_delta_abs = eig_delta_abs,
    artifact_threshold = artifact_threshold
  )
  params_object <- validate_and_override_params(params_object)
  # "ss_mixture" inherits from "ss" so generic ss methods still apply.
  data_object <- structure(
    list(
      X = X_ss,
      XtX = XtX,
      Xty = sqrt(nm1) * z,
      yty = nm1,
      n = n,
      p = p,
      X_colmeans = rep(0, p),
      y_mean = 0,
      nm1 = nm1,
      z = z,
      lambda = 0,
      R_finite_B = R_finite_B,
      R_finite_diagnostics = R_finite_diagnostics,
      R_mismatch = R_mismatch,
      X_list_std = X_list,
      B_list = B_list,
      K = K,
      panel_R = panel_R,
      omega_cache = omega_cache
    ),
    class = c("ss_mixture", "ss")
  )
  # eigen(R) cache for the Q_art QC diagnostic (map_qc only; O(p^3)).
  if (R_mismatch == "map_qc")
    data_object$eigen_R <- eigen(R_init, symmetric = TRUE)
  list(data = data_object, params = params_object)
}

# =============================================================================
# RSS LAMBDA DATA CONSTRUCTOR
#
# Constructs data and params objects for SuSiE from RSS data using eigendecomposition
# (lambda >= 0).
# Handles eigen decomposition, MAF filtering, and specialized RSS-lambda preprocessing.
# =============================================================================
#'
#' @return A list containing:
#' \item{data}{A processed list containing z-scores, R matrix, eigen decomposition,
#' and RSS-lambda specific fields}
#' \item{params}{Validated params object with all input algorithm parameters}
#'
#' @keywords internal
#' @noRd
rss_lambda_constructor <- function(z, R = NULL, X = NULL, n = NULL,
                                   L = min(10, if (!is.null(R)) ncol(R) else ncol(X)),
                                   lambda = 0,
                                   maf = NULL,
                                   maf_thresh = 0,
                                   prior_variance = 50,
                                   residual_variance = NULL,
                                   prior_weights = NULL,
                                   null_weight = 0,
                                   intercept_value = 0,
                                   estimate_residual_variance = FALSE,
                                   estimate_residual_method = "MLE",
                                   estimate_prior_variance = TRUE,
                                   estimate_prior_method = "optim",
                                   prior_variance_grid = NULL,
                                   mixture_weights = NULL,
                                   check_null_threshold = 0,
                                   prior_tol = 1e-9,
                                   residual_variance_lowerbound = 0,
                                   model_init = NULL,
                                   coverage = 0.95,
                                   min_abs_corr = 0.5,
                                   max_iter = 100,
                                   tol = 1e-3,
                                   convergence_method = "elbo",
                                   verbose = FALSE,
                                   track_fit = FALSE,
                                   check_prior = TRUE,
                                   check_R = TRUE,
                                   check_z = FALSE,
                                   n_purity = 100,
                                   r_tol = 1e-8,
                                   refine = FALSE,
                                   slot_prior = NULL,
                                   L_greedy = NULL,
                                   greedy_lbf_cutoff = 0.1) {
  # Only MLE residual-variance estimation is implemented for RSS-lambda.
  if (!identical(estimate_residual_method, "MLE")) {
    stop("RSS-lambda supports estimate_residual_method = \"MLE\" only.")
  }
  # Reject list-of-matrices inputs; this constructor handles one panel only.
  if (is.list(R) && !is.matrix(R)) {
    stop("rss_lambda_constructor() accepts only a single R matrix.")
  }
  if (is.list(X) && !is.matrix(X)) {
    stop("rss_lambda_constructor() accepts only a single X matrix.")
  }

  # PVE-adjust z when sample size is provided. Shrinks large z toward
  # zero to account for winner's curse. Same form as the SS path
  # (summary_stats_constructor); skipped when n is unavailable.
  if (!is.null(z) && !is.null(n) && is.numeric(n) && length(n) == 1 &&
      is.finite(n) && n > 1) {
    adj <- (n - 1) / (z^2 + n - 2)
    z <- sqrt(adj) * z
  }

  if (is.null(X)) {
    # R path: validate R
    if (is.null(R)) {
      stop("Please provide either R or X for rss_lambda_constructor.")
    }
    if (nrow(R) != length(z)) {
      stop(paste0(
        "The dimension of correlation matrix (", nrow(R), " by ", ncol(R),
        ") does not agree with expected (", length(z), " by ", length(z), ")."
      ))
    }
    if (!is_symmetric_matrix(R)) {
      warning_message("R not symmetric; using (R + t(R))/2.")
      R <- (R + t(R)) / 2
    }
    # BUGFIX: these are scalar (length-one) conditions, so use the
    # short-circuiting && rather than the elementwise & operator.
    if (!(is.double(R) && is.matrix(R)) && !inherits(R, "sparseMatrix")) {
      stop("Input R must be a double-precision matrix or a sparse matrix.")
    }
  } else {
    # Single-panel X path: validate X
    if (ncol(X) != length(z)) {
      stop(paste0(
        "The number of columns of X (", ncol(X),
        ") does not agree with expected (", length(z), ")."
      ))
    }
  }

  # MAF filter: keep only variants with maf above maf_thresh, applied
  # consistently to R, X and z.
  if (!is.null(maf)) {
    if (length(maf) != length(z)) {
      stop(paste0("The length of maf does not agree with expected ", length(z), "."))
    }
    id <- which(maf > maf_thresh)
    if (!is.null(R)) R <- R[id, id]
    if (!is.null(X)) X <- X[, id, drop = FALSE]
    z <- z[id]
  }

  if (any(is.infinite(z))) {
    stop("z contains infinite values.")
  }

  # Check for NAs
  if (!is.null(R) && anyNA(R)) {
    stop("R matrix contains missing values.")
  }

  # Replace NAs in z with zero
  if (anyNA(z)) {
    warning_message("NA values in z-scores are replaced with 0.")
    z[is.na(z)] <- 0
  }

  # Handle null weight: a zero weight is equivalent to no null column.
  if (is.numeric(null_weight) && null_weight == 0) {
    null_weight <- NULL
  }
  if (!is.null(null_weight)) {
    if (!is.numeric(null_weight)) {
      stop("Null weight must be numeric.")
    }
    if (null_weight < 0 || null_weight >= 1) {
      stop("Null weight must be between 0 and 1.")
    }
    # Append a "null" variable: rescale prior weights and pad R/X/z
    # with an all-zero column (and row, for R).
    p_cur <- if (!is.null(R)) ncol(R) else ncol(X)
    if (is.null(prior_weights)) {
      prior_weights <- c(rep(1 / p_cur * (1 - null_weight), p_cur), null_weight)
    } else {
      prior_weights <- c(prior_weights * (1 - null_weight), null_weight)
    }
    if (!is.null(R)) R <- cbind(rbind(R, 0), 0)
    if (!is.null(X)) X <- cbind(X, 0)
    z <- c(z, 0)
  }

  # Determine p and set prior weights
  p <- if (!is.null(R)) ncol(R) else ncol(X)
  if (is.null(prior_weights)) {
    prior_weights <- rep(1 / p, p)
  }

  # Eigen decomposition: from R or SVD of X
  if (!is.null(X)) {
    # Single-panel: standardize so X'X = R, then SVD
    X <- standardize_X(X)
    eigen_R <- eigen_from_X(X, p)
  } else {
    eigen_R <- eigen(R, symmetric = TRUE)
  }
  if (is.null(X) && check_R && any(eigen_R$values < -r_tol)) {
    stop(paste0(
      "The correlation matrix (", nrow(R), " by ", ncol(R),
      ") is not a positive semidefinite matrix. ",
      "The smallest eigenvalue is ", min(eigen_R$values),
      ". You can bypass this by \"check_R = FALSE\" which instead ",
      "sets negative eigenvalues to 0 to allow for continued ",
      "computations."
    ))
  }

  # Check whether z in space spanned by the non-zero eigenvectors of R
  if (is.null(X) && check_z) {
    colspace <- which(eigen_R$values > r_tol)
    if (length(colspace) < length(z)) {
      znull <- crossprod(eigen_R$vectors[, -colspace], z)
      if (sum(znull^2) > r_tol * sum(z^2)) {
        warning_message("Input z does not lie in the space of non-zero eigenvectors of R.")
      } else {
        message("Input z is in space spanned by the non-zero eigenvectors of R.\n")
      }
    }
  }

  # Set negative eigenvalues to zero
  eigen_R$values[eigen_R$values < r_tol] <- 0

  # Precompute V'z
  Vtz <- crossprod(eigen_R$vectors, z)

  # Compute Null-space z-score norm: ||z||^2 - ||V'z||^2.
  z_null_norm2 <- max(sum(z^2) - sum(Vtz^2), 0)

  # Handle lambda estimation: lambda is the average squared projection
  # of z onto the null space of R (zero when R has full column space).
  if (identical(lambda, "estimate")) {
    colspace <- which(eigen_R$values > 0)
    if (length(colspace) == length(z)) {
      lambda <- 0
    } else {
      znull <- crossprod(eigen_R$vectors[, -colspace], z)
      lambda <- sum(znull^2) / length(znull)
    }
  }

  # Residual variance defaults to 1 - lambda; a user-supplied value is
  # reduced by lambda so the two components sum to the supplied total.
  if (is.null(residual_variance)) {
    residual_variance <- 1 - lambda
  } else {
    residual_variance <- residual_variance - lambda
  }

  # Create params object with ALL algorithm parameters
  params_object <- list(
    L = L,
    scaled_prior_variance = prior_variance, # Use unscaled prior_variance for RSS-lambda
    residual_variance = residual_variance,
    prior_weights = prior_weights,
    null_weight = null_weight,
    estimate_residual_variance = estimate_residual_variance,
    estimate_residual_method = estimate_residual_method,
    estimate_prior_variance = estimate_prior_variance,
    estimate_prior_method = estimate_prior_method,
    prior_variance_grid = prior_variance_grid,
    mixture_weights = mixture_weights,
    unmappable_effects = "none", # RSS-lambda doesn't support unmappable effects
    check_null_threshold = check_null_threshold,
    prior_tol = prior_tol,
    residual_variance_upperbound = 1, # RSS constraint
    model_init = model_init,
    coverage = coverage,
    min_abs_corr = min_abs_corr,
    compute_univariate_zscore = FALSE,
    max_iter = max_iter,
    tol = tol,
    convergence_method = convergence_method,
    verbose = verbose,
    track_fit = track_fit,
    residual_variance_lowerbound = residual_variance_lowerbound,
    refine = refine,
    n_purity = n_purity,
    alpha0 = 0, # RSS doesn't support NIG
    beta0 = 0, # RSS doesn't support NIG
    n = n,
    use_NIG = FALSE,
    intercept = FALSE, # RSS always uses intercept = FALSE
    standardize = FALSE, # Never standardize RSS-lambda
    check_prior = check_prior,
    slot_prior = slot_prior,
    L_greedy = L_greedy,
    greedy_lbf_cutoff = greedy_lbf_cutoff
  )

  # Validate params
  params_object <- validate_and_override_params(params_object)

  # Create data object with RSS-lambda specific fields. n is the GWAS
  # sample size (used by the PVE adjustment above and by any downstream
  # consumer that needs to know the GWAS size); we store NA_integer_ when
  # the caller did not supply it. p (the number of variants) is always
  # length(z).
  data_object <- structure(
    list(
      z = z,
      R = R,
      X = X,
      n = if (is.null(n)) NA_integer_ else as.integer(n),
      p = length(z),
      lambda = lambda,
      intercept_value = intercept_value,
      r_tol = r_tol,
      prior_variance = prior_variance,
      eigen_R = eigen_R,
      Vtz = Vtz,
      z_null_norm2 = z_null_norm2
    ),
    class = "rss_lambda"
  )
  return(list(data = data_object, params = params_object))
}



================================================
FILE: R/susie_get_functions.R
================================================
#' @rdname susie_get_methods
#'
#' @title Inferences From Fitted SuSiE Model
#'
#' @description These functions access basic properties or draw
#' inferences from a fitted susie model.
#'
#' @param res A susie fit, typically an output from
#' \code{\link{susie}} or one of its variants. For
#' \code{susie_get_pip} and \code{susie_get_cs}, this may instead be
#' the posterior inclusion probability matrix, \code{alpha}.
#'
#' @param last_only If \code{last_only = FALSE}, return the ELBO from
#' all iterations; otherwise return the ELBO from the last iteration
#' only.
#'
#' @param warning_tol Warn if ELBO is decreasing by this
#' tolerance level.
#'
#' @return \code{susie_get_objective} returns the evidence lower bound
#' (ELBO) achieved by the fitted susie model and, optionally, at each
#' iteration of the IBSS fitting procedure.
#'
#' \code{susie_get_residual_variance} returns the (estimated or
#' fixed) residual variance parameter.
#'
#' \code{susie_get_prior_variance} returns the (estimated or fixed)
#' prior variance parameters.
#'
#' \code{susie_get_posterior_mean} returns the posterior mean for the
#' regression coefficients of the fitted susie model.
#'
#' \code{susie_get_posterior_sd} returns the posterior standard
#' deviation for coefficients of the fitted susie model.
#'
#' \code{susie_get_niter} returns the number of model fitting
#' iterations performed.
#'
#' \code{susie_get_pip} returns a vector containing the posterior
#' inclusion probabilities (PIPs) for all variables.
#'
#' \code{susie_get_lfsr} returns a vector containing the average lfsr
#' across variables for each single-effect, weighted by the posterior
#' inclusion probability (alpha).
#'
#' \code{susie_get_posterior_samples} returns a list containing the
#' effect sizes samples and causal status with two components: \code{b},
#' an \code{num_variables} x \code{num_samples} matrix of effect
#' sizes; \code{gamma}, an \code{num_variables} x \code{num_samples}
#' matrix of causal status random draws.
#'
#' \code{susie_get_cs} returns credible sets (CSs) from a susie fit,
#' as well as summaries of correlation among the variables included in
#' each CS. If desired, one can filter out CSs that do not meet a
#' specified \dQuote{purity} threshold; to do this, either \code{X} or
#' \code{Xcorr} must be supplied. It returns a list with the following
#' elements:
#'
#' \item{cs}{A list in which each list element is a vector containing
#' the indices of the variables in the CS.}
#'
#' \item{coverage}{The nominal coverage specified for each CS.}
#'
#' \item{purity}{If \code{X} or \code{Xcorr} is provided, the
#' purity of each CS.}
#'
#' \item{cs_index}{If \code{X} or \code{Xcorr} is provided, the index
#' (number between 1 and L) of each reported CS in the supplied susie
#' fit.}
#'
#' @examples
#' set.seed(1)
#' n <- 1000
#' p <- 1000
#' beta <- rep(0, p)
#' beta[1:4] <- 1
#' X <- matrix(rnorm(n * p), nrow = n, ncol = p)
#' X <- scale(X, center = TRUE, scale = TRUE)
#' y <- drop(X %*% beta + rnorm(n))
#' s <- susie(X, y, L = 10)
#' susie_get_objective(s)
#' susie_get_objective(s, last_only = FALSE)
#' susie_get_residual_variance(s)
#' susie_get_prior_variance(s)
#' susie_get_posterior_mean(s)
#' susie_get_posterior_sd(s)
#' susie_get_niter(s)
#' susie_get_pip(s)
#' susie_get_lfsr(s)
#'
#' @export
#'
susie_get_objective <- function(res, last_only = TRUE, warning_tol = 1e-6) {
  # Warn when the ELBO decreased by more than warning_tol between any
  # two successive iterations.
  if (!all(diff(res$elbo) >= (-1 * warning_tol))) {
    warning_message("Objective is decreasing")
  }
  if (last_only) {
    return(res$elbo[length(res$elbo)])
  } else {
    return(res$elbo)
  }
}

#' @rdname susie_get_methods
#'
#' @export
#'
susie_get_posterior_mean <- function(res, prior_tol = 1e-9) {
  # Drop the single-effects with estimated prior of zero.
  if (is.numeric(res$V)) {
    include_idx <- which(res$V > prior_tol)
  } else {
    include_idx <- 1:nrow(res$alpha)
  }
  # Now extract relevant rows from alpha matrix.
  # Per-variable posterior mean is the alpha-weighted mu summed over
  # the retained effects, rescaled back to the original X scale.
  if (length(include_idx) > 0) {
    return(colSums((res$alpha * res$mu)[include_idx, , drop = FALSE]) /
             res$X_column_scale_factors)
  } else {
    return(numeric(ncol(res$mu)))
  }
}

#' @rdname susie_get_methods
#'
#' @export
#'
susie_get_posterior_sd <- function(res, prior_tol = 1e-9) {
  # Drop the single-effects with estimated prior of zero.
  if (is.numeric(res$V)) {
    include_idx <- which(res$V > prior_tol)
  } else {
    include_idx <- 1:nrow(res$alpha)
  }
  # Now extract relevant rows from alpha matrix.
  # Per-effect posterior variance is alpha*mu2 - (alpha*mu)^2, summed
  # over the retained effects, then rescaled to the original X scale.
  if (length(include_idx) > 0) {
    return(sqrt(colSums((res$alpha * res$mu2 -
                           (res$alpha * res$mu)^2)[include_idx, , drop = FALSE])) /
             (res$X_column_scale_factors))
  } else {
    return(numeric(ncol(res$mu)))
  }
}

#' @rdname susie_get_methods
#'
#' @export
#'
susie_get_niter <- function(res) {
  res$niter
}

#' @rdname susie_get_methods
#'
#' @export
#'
susie_get_prior_variance <- function(res) {
  res$V
}

#' @rdname susie_get_methods
#'
#' @export
#'
susie_get_residual_variance <- function(res) {
  res$sigma2
}

#' @rdname susie_get_methods
#'
#' @importFrom stats pnorm
#'
#' @export
#'
susie_get_lfsr <- function(res) {
  # pos_prob here is P(effect <= 0) computed from each effect's
  # posterior mean and sd; pmax with its complement gives the
  # probability of the more likely sign.
  pos_prob <- pnorm(0, mean = t(res$mu), sd = sqrt(res$mu2 - res$mu^2))
  neg_prob <- 1 - pos_prob
  # Average the per-variable sign certainty, weighted by alpha.
  return(1 - rowSums(res$alpha * t(pmax(pos_prob, neg_prob))))
}

#' @rdname susie_get_methods
#'
#' @param susie_fit A susie fit, an output from \code{\link{susie}}.
#'
#' @param num_samples The number of draws from the posterior
#' distribution.
#'
#' @importFrom stats rmultinom
#' @importFrom stats rnorm
#'
#' @export
#'
susie_get_posterior_samples <- function(susie_fit, num_samples) {
  # Remove effects having estimated prior variance equals zero.
  if (is.numeric(susie_fit$V)) {
    include_idx <- which(susie_fit$V > 1e-9)
  } else {
    include_idx <- 1:nrow(susie_fit$alpha)
  }
  # Posterior mean/sd rescaled back to the original X column scale.
  posterior_mean <- sweep(susie_fit$mu, 2, susie_fit$X_column_scale_factors, "/")
  posterior_sd <- sweep(
    sqrt(susie_fit$mu2 - (susie_fit$mu)^2), 2,
    susie_fit$X_column_scale_factors, "/"
  )
  pip <- susie_fit$alpha
  L <- nrow(pip)
  num_snps <- ncol(pip)
  b_samples <- matrix(as.numeric(NA), num_snps, num_samples)
  gamma_samples <- matrix(as.numeric(NA), num_snps, num_samples)
  for (sample_i in 1:num_samples) {
    b <- 0
    if (length(include_idx) > 0) {
      for (l in include_idx) {
        # Draw which variable carries effect l (multinomial over its
        # alpha row), then draw that variable's effect size.
        gamma_l <- rmultinom(1, 1, pip[l, ])
        effect_size <- rnorm(1,
          mean = posterior_mean[l, which(gamma_l != 0)],
          sd = posterior_sd[l, which(gamma_l != 0)]
        )
        b_l <- gamma_l * effect_size
        b <- b + b_l
      }
    }
    b_samples[, sample_i] <- b
    # gamma records which variables received a nonzero draw.
    gamma_samples[, sample_i] <- as.numeric(b != 0)
  }
  return(list(b = b_samples, gamma = gamma_samples))
}

#' @rdname susie_get_methods
#' @param X n by p matrix of values of the p variables (covariates) in
#' n samples. When provided, correlation between variables will be
#' computed and used to remove CSs whose minimum correlation among
#' variables is smaller than \code{min_abs_corr}.
#'
#' @param Xcorr p by p matrix of correlations between variables
#' (covariates). When provided, it will be used to remove CSs whose
#' minimum correlation among variables is smaller than
#' \code{min_abs_corr}.
#'
#' @param coverage A number between 0 and 1 specifying desired
#' coverage of each CS.
#'
#' @param min_abs_corr A "purity" threshold for the CS. Any CS that
#' contains a pair of variables with correlation less than this
#' threshold will be filtered out and not reported. This filter is
#' only applied when \code{X} or \code{Xcorr} is provided; otherwise
#' it is ignored and a warning is issued.
#'
#' @param dedup If \code{dedup = TRUE}, remove duplicate CSs.
#'
#' @param squared If \code{squared = TRUE}, report min, mean and
#' median of squared correlation instead of the absolute correlation.
#'
#' @param check_symmetric If \code{check_symmetric = TRUE}, perform a
#' check for symmetry of matrix \code{Xcorr} when \code{Xcorr} is
#' provided (not \code{NULL}).
#'
#' @param n_purity The maximum number of credible set (CS) variables
#' used in calculating the correlation (\dQuote{purity})
#' statistics. When the number of variables included in the CS is
#' greater than this number, the CS variables are randomly subsampled.
#'
#' @param use_rfast Use the Rfast package for the purity calculations.
#' By default \code{use_rfast = TRUE} if the Rfast package is
#' installed.
#'
#' @param ld_extend_threshold Threshold for extending CS by LD (default 0.99).
#' Variants with |correlation| > threshold with any CS member are added.
#' Set to NULL to disable LD extension. Requires Xcorr (would not work if only X is provided).
#'
#' @export
#'
susie_get_cs <- function(res, X = NULL, Xcorr = NULL, coverage = 0.95,
                         min_abs_corr = 0.5, dedup = TRUE, squared = FALSE,
                         check_symmetric = TRUE, n_purity = 100,
                         use_rfast = NULL, ld_extend_threshold = 0.99) {
  if (!is.null(X) && !is.null(Xcorr)) {
    stop("Only one of X or Xcorr should be specified")
  }
  if (is.null(X) && is.null(Xcorr)) {
    warning_message(
      "Neither X nor Xcorr was provided; purity filtering is skipped ",
      "and min_abs_corr will have no effect. Pass X or Xcorr to enable ",
      "the purity filter."
    )
  }
  if (check_symmetric) {
    if (!is.null(Xcorr) && !is_symmetric_matrix(Xcorr)) {
      warning_message(
        "Xcorr is not symmetric; forcing Xcorr to be symmetric ",
        "by replacing Xcorr with (Xcorr + t(Xcorr))/2"
      )
      Xcorr <- Xcorr + t(Xcorr)
      Xcorr <- Xcorr / 2
    }
  }

  null_index <- 0
  include_idx <- rep(TRUE, nrow(res$alpha))
  if (!is.null(res$null_index)) null_index <- res$null_index
  if (is.numeric(res$V)) include_idx <- res$V > 1e-9

  # L x P binary matrix
  status <- in_CS(res$alpha, coverage)

  # L-list of CS positions
  cs <- lapply(seq_len(nrow(status)), function(i) which(status[i, ] != 0))
  claimed_coverage <- sapply(
    seq_along(cs),
    function(i) sum(res$alpha[i, ][cs[[i]]])
  )
  # lengths() replaces the list comparison lapply(cs, length) > 0:
  # same result, clearer intent, atomic from the start.
  include_idx <- include_idx * (lengths(cs) > 0)
  # FIXME: see issue 21
  # https://github.com/stephenslab/susieR/issues/21
  if (dedup) {
    include_idx <- include_idx * (!duplicated(cs))
  }
  include_idx <- as.logical(include_idx)
  if (sum(include_idx) == 0) {
    return(list(
      cs = NULL,
      coverage = NULL,
      requested_coverage = coverage
    ))
  }
  cs <- cs[include_idx]
  claimed_coverage <- claimed_coverage[include_idx]

  # Track which original effects these correspond to
  effect_indices <- which(include_idx)

  # Compute and filter by "purity"
  if (is.null(use_rfast)) {
    use_rfast <- requireNamespace("Rfast", quietly = TRUE)
  }

  # If no correlation info, return without purity or LD extension
  if (is.null(Xcorr) && is.null(X)) {
    names(cs) <- paste0("L", effect_indices)
    return(list(
      cs = cs,
      coverage = claimed_coverage,
      requested_coverage = coverage
    ))
  }

  # Extend CS by LD if threshold is set and Xcorr is available
  # Note: LD extension requires Xcorr; if only X is provided, skip extension
  # (X may be sparse, and computing full Xcorr is expensive/infeasible)
  if (!is.null(ld_extend_threshold) && !is.null(Xcorr)) {
    for (i in seq_along(cs)) {
      cs_idx <- cs[[i]]
      # Find variants in tight LD with any CS member
      ld_with_cs <- abs(Xcorr[cs_idx, , drop = FALSE]) > ld_extend_threshold
      in_tight_ld <- which(colSums(ld_with_cs) > 0)
      # Extend CS
      cs[[i]] <- sort(unique(c(cs_idx, in_tight_ld)))
      # Update coverage for extended CS
      claimed_coverage[i] <- sum(res$alpha[effect_indices[i], cs[[i]]])
    }
  }

  # Compute purity for each CS; a CS containing the null variable gets
  # the sentinel value -9 in all three purity columns.
  purity <- NULL
  for (i in seq_along(cs)) {
    if (null_index > 0 && null_index %in% cs[[i]]) {
      purity <- rbind(purity, c(-9, -9, -9))
    } else {
      purity <- rbind(
        purity,
        matrix(get_purity(cs[[i]], X, Xcorr, squared, n_purity, use_rfast), 1, 3)
      )
    }
  }
  purity <- as.data.frame(purity)
  if (squared) {
    colnames(purity) <- c("min.sq.corr", "mean.sq.corr", "median.sq.corr")
  } else {
    colnames(purity) <- c("min.abs.corr", "mean.abs.corr", "median.abs.corr")
  }
  threshold <- ifelse(squared, min_abs_corr^2, min_abs_corr)
  is_pure <- which(purity[, 1] >= threshold)
  if (length(is_pure) > 0) {
    cs <- cs[is_pure]
    purity <- purity[is_pure, , drop = FALSE]
    claimed_coverage <- claimed_coverage[is_pure]
    effect_indices <- effect_indices[is_pure]
    row_names <- paste0("L", effect_indices)
    names(cs) <- row_names
    rownames(purity) <- row_names

    # Re-order CS list and purity rows based on purity
    ordering <- order(purity[, 1], decreasing = TRUE)
    return(list(
      cs = cs[ordering],
      purity = purity[ordering, , drop = FALSE],
      cs_index = effect_indices[ordering],
      coverage = claimed_coverage[ordering],
      requested_coverage = coverage
    ))
  } else {
    return(list(cs = NULL, coverage = NULL, requested_coverage = coverage))
  }
}

#' @title Get Correlations Between CSs, using Variable with Maximum PIP From Each CS
#'
#' @description This function evaluates the correlation between single effect
#' CSs. It is not part of the SuSiE inference. Rather, it is designed as
#' a diagnostic tool to assess how correlated the reported CS are.
#'
#' @param model A SuSiE fit, typically an output from
#' \code{\link{susie}} or one of its variants.
#'
#' @param X n by p matrix of values of the p variables (covariates) in
#' n samples.
#' When provided, correlation between variables will be
#' computed and used to remove CSs whose minimum correlation among
#' variables is smaller than \code{min_abs_corr}.
#'
#' @param Xcorr p by p matrix of correlations between variables
#' (covariates). When provided, it will be used to remove CSs whose
#' minimum correlation among variables is smaller than
#' \code{min_abs_corr}.
#'
#' @param max When \code{max = FALSE}, return a matrix of CS
#' correlations. When \code{max = TRUE}, return only the maximum
#' absolute correlation among all pairs of correlations.
#'
#' @return A matrix of correlations between CSs, or the maximum
#' absolute correlation when \code{max = TRUE}.
#'
#' @export
#'
get_cs_correlation <- function(model, X = NULL, Xcorr = NULL, max = FALSE) {
  # Nothing to correlate when there are fewer than two CSs.
  if (is.null(model$sets$cs) || length(model$sets$cs) == 1) {
    return(NA)
  }
  if (!is.null(X) && !is.null(Xcorr)) {
    stop("Only one of X or Xcorr should be specified")
  }
  if (is.null(Xcorr) && is.null(X)) {
    stop("One of X or Xcorr must be specified")
  }
  if (!is.null(Xcorr) && !is_symmetric_matrix(Xcorr)) {
    warning_message(
      "Xcorr is not symmetric; forcing Xcorr to be symmetric ",
      "by replacing Xcorr with (Xcorr + t(Xcorr))/2"
    )
    Xcorr <- Xcorr + t(Xcorr)
    Xcorr <- Xcorr / 2
  }
  # Get index for the best PIP per CS
  max_pip_idx <- sapply(model$sets$cs, function(cs) cs[which.max(model$pip[cs])])
  # Correlate the representative (max-PIP) variables, either from raw
  # X columns or directly from the supplied correlation matrix.
  if (is.null(Xcorr)) {
    X_sub <- X[, max_pip_idx]
    cs_corr <- safe_cor(as.matrix(X_sub))
  } else {
    cs_corr <- Xcorr[max_pip_idx, max_pip_idx]
  }
  if (max) {
    cs_corr <- max(abs(cs_corr[upper.tri(cs_corr)]))
  } else {
    rownames(cs_corr) <- colnames(cs_corr) <- names(model$sets$cs)
  }
  return(cs_corr)
}

#' @rdname susie_get_methods
#'
#' @param prune_by_cs Whether or not to ignore single effects not in
#' a reported CS when calculating PIP.
#'
#' @param prior_tol Filter out effects having estimated prior variance
#' smaller than this threshold.
#'
#' @export
#'
susie_get_pip <- function(res, prune_by_cs = FALSE, prior_tol = 1e-9) {
  if (inherits(res, "susie")) {
    # Drop null weight columns.
    if (!is.null(res$null_index) && res$null_index > 0) {
      res$alpha <- res$alpha[, -res$null_index, drop = FALSE]
    }

    # Drop the single-effects with estimated prior of zero.
    if (is.numeric(res$V)) {
      include_idx <- which(res$V > prior_tol)
    } else {
      include_idx <- 1:nrow(res$alpha)
    }

    # Only consider variables in reported CS.
    # This is not what we do in the SuSiE paper.
    # So by default prune_by_cs = FALSE means we do not run the
    # following code.
    if (!is.null(res$sets$cs_index) && prune_by_cs) {
      include_idx <- intersect(include_idx, res$sets$cs_index)
    }
    if (is.null(res$sets$cs_index) && prune_by_cs) {
      include_idx <- numeric(0)
    }

    # Extract slot weights (c_hat) if available for Gamma-Poisson weighting.
    # PIP_j = 1 - prod_l(1 - c_hat[l] * alpha[l,j])
    # (Faithfully ported from susieAnn posterior.R:195-200)
    slot_wt <- res$slot_weights

    # now extract relevant rows from alpha matrix
    if (length(include_idx) > 0) {
      res_alpha <- res$alpha[include_idx, , drop = FALSE]
      if (!is.null(slot_wt)) {
        slot_wt <- slot_wt[include_idx]
      }
    } else {
      res_alpha <- matrix(0, 1, ncol(res$alpha))
      slot_wt <- NULL
    }
    res <- res_alpha
  }

  # c_hat-weighted PIPs when slot_weights are available
  if (exists("slot_wt", inherits = FALSE) && !is.null(slot_wt)) {
    weighted_alpha <- sweep(res, 1, slot_wt, `*`)
    return(as.vector(1 - apply(1 - weighted_alpha, 2, prod)))
  }
  return(as.vector(1 - apply(1 - res, 2, prod)))
}

#' @title Initialize a susie object using regression coefficients
#'
#' @param coef_index An L-vector containing the indices of the
#' nonzero coefficients.
#'
#' @param coef_value An L-vector containing initial coefficient
#' estimates.
#'
#' @param p A scalar giving the number of variables.
#'
#' @return A list with elements \code{alpha}, \code{mu} and \code{mu2}
#' to be used by \code{susie}.
#'
#' @examples
#' set.seed(1)
#' n = 1000
#' p = 1000
#' beta = rep(0,p)
#' beta[sample(1:1000,4)] = 1
#' X = matrix(rnorm(n*p),nrow = n,ncol = p)
#' X = scale(X,center = TRUE,scale = TRUE)
#' y = drop(X %*% beta + rnorm(n))
#'
#' # Initialize susie to ground-truth coefficients.
#' s = susie_init_coef(which(beta != 0),beta[beta != 0],length(beta))
#' res = susie(X,y,L = 10,model_init=s)
#'
#' @export
#'
susie_init_coef <- function(coef_index, coef_value, p) {
  # Number of single effects implied by the initialization.
  L <- length(coef_index)
  if (L <= 0) {
    stop("Need at least one non-zero effect")
  }
  if (!all(coef_value != 0)) {
    stop("Input coef_value must be non-zero for all its elements")
  }
  if (L != length(coef_value)) {
    # Fixed grammar in this error message ("must of" -> "must be of").
    stop("Inputs coef_index and coef_value must be of the same length")
  }
  # Robustness: indices must lie in 1..p; previously a zero/negative
  # index failed later with an opaque subscript error.
  if (min(coef_index) < 1) {
    stop("Input coef_index must contain positive indices")
  }
  if (max(coef_index) > p) {
    stop("Input coef_index exceeds the boundary of p")
  }
  # One single effect per row: alpha places all posterior mass on the
  # chosen variable and mu carries its initial coefficient estimate.
  # Matrix indexing replaces the element-by-element loop.
  alpha <- matrix(0, nrow = L, ncol = p)
  mu <- matrix(0, nrow = L, ncol = p)
  idx <- cbind(seq_len(L), coef_index)
  alpha[idx] <- 1
  mu[idx] <- coef_value
  out <- list(alpha = alpha, mu = mu, mu2 = mu * mu)
  class(out) <- c("susie", "list")
  return(out)
}


================================================
FILE: R/susie_plot.R
================================================
#' @rdname susie_plots
#'
#' @title SuSiE Plots.
#'
#' @description \code{susie_plot} produces a per-variable summary of
#' the SuSiE credible sets. \code{susie_plot_iteration} produces a
#' diagnostic plot for the susie model fitting. For
#' \code{susie_plot_iteration}, several plots will be created if
#' \code{track_fit = TRUE} when calling \code{susie}.
#'
#' @param model A SuSiE fit, typically an output from
#' \code{\link{susie}} or one of its variants. For \code{susie_plot},
#' the susie fit must have \code{model$z}, \code{model$PIP}, and may
#' include \code{model$sets}. \code{model} may also be a vector of
#' z-scores or PIPs.
#'
#' @param y A string indicating what to plot: either \code{"z_original"} for
#' z-scores, \code{"z"} for z-score derived p-values on (base-10) log-scale,
#' \code{"PIP"} for posterior inclusion probabilities,
#' \code{"log10PIP"} for posterior inclusion probabilities on the
#' (base-10) log-scale. For any other setting, the data are plotted as
#' is.
#'
#' @param add_bar If \code{add_bar = TRUE}, add horizontal bar to
#' signals in credible interval.
#'
#' @param pos This can be either be (1) a numeric vector of indices of
#' subset of variables to plot, or (2) a list with the following list
#' elements: \code{pos$attr}, \code{pos$start} and \code{pos$end},
#' where \code{pos$attr} is a character string of the name of index
#' variable in \code{model} object, and \code{pos$start} and
#' \code{pos$end} are boundaries of indices to plot. See the provided
#' examples.
#'
#' @param b For simulated data, set \code{b = TRUE} to highlight
#' "true" effects (highlights in red).
#'
#' @param max_cs The largest credible set to display, either based on
#' purity (set \code{max_cs} between 0 and 1), or based on size (set
#' \code{max_cs > 1}).
#'
#' @param add_legend If \code{add_legend = TRUE}, add a legend to
#' annotate the size and purity of each CS discovered. It can also be
#' specified as location where legends should be added, e.g.,
#' \code{add_legend = "bottomright"} (default location is
#' \code{"topright"}).
#'
#' @param \dots Additional arguments passed to
#' \code{\link[graphics]{plot}}.
#'
#' @return Invisibly returns \code{NULL}.
#'
#' @seealso \code{\link{susie_plot_changepoint}}
#'
#' @examples
#' set.seed(1)
#' n <- 1000
#' p <- 1000
#' beta <- rep(0, p)
#' beta[sample(1:1000, 4)] <- 1
#' X <- matrix(rnorm(n * p), nrow = n, ncol = p)
#' X <- scale(X, center = TRUE, scale = TRUE)
#' y <- drop(X %*% beta + rnorm(n))
#' res <- susie(X, y, L = 10)
#' susie_plot(res, "PIP")
#' susie_plot(res, "PIP", add_bar = TRUE)
#' susie_plot(res, "PIP", add_legend = TRUE)
#' susie_plot(res, "PIP", pos = 1:500, add_legend = TRUE)
#' # Plot selected regions with adjusted x-axis position label
#' res$genomic_position <- 1000 + (1:length(res$pip))
#' susie_plot(res, "PIP",
#'   add_legend = TRUE,
#'   pos = list(attr = "genomic_position", start = 1000, end = 1500)
#' )
#' # True effects are shown in red.
#' susie_plot(res, "PIP", b = beta, add_legend = TRUE)
#'
#' @importFrom utils head
#' @importFrom stats pnorm
#' @importFrom graphics plot
#' @importFrom graphics segments
#' @importFrom graphics points
#' @importFrom graphics legend
#' @importFrom graphics par
#'
#' @export
#'
susie_plot <- function(model, y, add_bar = FALSE, pos = NULL, b = NULL,
                       max_cs = 400, add_legend = NULL, ...)
{
  is_susie <- inherits(model, "susie")
  ylab <- y
  # Palette used to mark CS members; rotated as each CS is drawn.
  color <- c(
    "dodgerblue2",
    "green4",
    "#6A3D9A", # purple
    "#FF7F00", # orange
    "gold1",
    "skyblue2",
    "#FB9A99", # lt pink
    "palegreen2",
    "#CAB2D6", # lt purple
    "#FDBF6F", # lt orange
    "gray70",
    "khaki2",
    "maroon",
    "orchid1",
    "deeppink1",
    "blue1",
    "steelblue4",
    "darkturquoise",
    "green1",
    "yellow4",
    "yellow3",
    "darkorange4",
    "brown"
  )
  # Resolve the quantity p to plot on the y axis from the requested
  # y mode; vectors (non-susie input) are used directly.
  if (y == "z") {
    if (is_susie) {
      if (is.null(model$z)) {
        stop(
          "z-scores are not available from SuSiE fit; please set ",
          "compute_univariate_zscore = TRUE in susie() call"
        )
      }
      zneg <- -abs(model$z)
    } else {
      zneg <- -abs(model)
    }
    # Two-sided p-value from the z-score, on the -log10 scale.
    p <- -log10(2 * pnorm(zneg))
    ylab <- "-log10(p)"
  } else if (y == "z_original") {
    if (is_susie) {
      if (is.null(model$z)) {
        stop(
          "z-scores are not available from SuSiE fit; please set ",
          "compute_univariate_zscore = TRUE in susie() call"
        )
      }
      p <- model$z
    } else {
      p <- model
    }
    ylab <- "z score"
  } else if (y == "PIP") {
    if (is_susie) {
      p <- model$pip
    } else {
      p <- model
    }
  } else if (y == "log10PIP") {
    if (is_susie) {
      p <- log10(model$pip)
    } else {
      p <- log10(model)
    }
    ylab <- "log10(PIP)"
  } else {
    if (is_susie) {
      stop("Need to specify z_original, z, PIP or log10PIP for SuSiE fits")
    }
    p <- model
  }
  if (is.null(b)) {
    b <- rep(0, length(p))
  }
  if (is.null(pos)) {
    pos <- 1:length(p)
  }
  start <- 0
  if (inherits(pos, "list")) {
    # Check input.
    if (is.null(pos$attr) || is.null(pos$start) || is.null(pos$end)) {
      stop("pos argument should be a list of list(attr=,start=,end=)")
    }
    if (!(pos$attr %in% names(model))) {
      stop(paste("Cannot find attribute", pos$attr, "in input model object"))
    }
    if (pos$start >= pos$end) {
      stop("Position start should be smaller than end")
    }
    # Map the model's position attribute onto a contiguous index range
    # [start, end] so the x axis shows genomic-style coordinates.
    start <- min(min(model[[pos$attr]]), pos$start)
    end <- max(max(model[[pos$attr]]), pos$end)
    # Add zeros to alpha and p.
    new_p <- rep(NA, end - start + 1)
    pos_with_value <- model[[pos$attr]] - start + 1
    new_p[pos_with_value] <- p
    p <- new_p
    # Adjust model$cs.
    if (!is.null(model$sets$cs)) {
      for (i in 1:length(model$sets$cs)) {
        model$sets$cs[[i]] <- pos_with_value[model$sets$cs[[i]]]
      }
    }
    # Change "pos" object to be indices.
    start_adj <- -min(min(model[[pos$attr]]) - pos$start, 0)
    end_adj <- max(max(model[[pos$attr]]) - pos$end, 0)
    pos <- (1 + start_adj):(length(p) - end_adj)
  } else {
    if (!all(pos %in% 1:length(p))) {
      stop("Provided position is outside the range of variables")
    }
    pos_with_value <- 1:length(p)
  }
  # Legend bookkeeping collected while drawing each CS below.
  legend_text <- list(col = vector(), purity = vector(), size = vector(),
                      cs_index = vector())
  # scipen0 = options()$scipen
  # options(scipen = 10)
  # Forward plotting arguments, filling in defaults not set by caller.
  args <- list(...)
  if (!exists("xlab", args)) args$xlab <- "variable"
  if (!exists("ylab", args)) args$ylab <- ylab
  if (!exists("pch", args)) args$pch <- 16
  args$x <- pos + start
  args$y <- p[pos]
  do.call(plot, args)
  if (is_susie && !is.null(model$sets$cs)) {
    for (cs_idx in rev(seq_along(model$sets$cs))) {
      cs_vars <- model$sets$cs[[cs_idx]]
      purity <- model$sets$purity[cs_idx, 1]
      # Apply filtering based on max_cs parameter
      if (!is.null(model$sets$purity) && max_cs < 1 && purity >= max_cs) {
        x0 <- intersect(pos, cs_vars)
        y1 <- p[x0]
      } else if (length(cs_vars) < max_cs) {
        x0 <- intersect(pos, cs_vars)
        y1 <- p[x0]
      } else {
        x0 <- NULL
        y1 <- NULL
      }
      if (is.null(x0)) {
        next
      }
      if (add_bar) {
        # Vertical gray bars from zero up to each CS member's value.
        y0 <- rep(0, length(x0))
        x1 <- x0
        segments(x0 + start, y0, x1 + start, y1, lwd = 1.5, col = "gray")
      }
      points(x0 + start, y1, col = head(color, 1), cex = 1.5, lwd = 2.5)
      legend_text$col <- append(head(color, 1), legend_text$col)
      # Rotate color.
color <- c(color[-1], color[1]) legend_text$purity <- append(round(purity, 4), legend_text$purity) legend_text$size <- append(length(x0), legend_text$size) # Store the original cs_index if (!is.null(model$sets$cs_index)) { legend_text$cs_index <- append(model$sets$cs_index[cs_idx], legend_text$cs_index) } else { legend_text$cs_index <- append(cs_idx, legend_text$cs_index) } } if (length(legend_text$col) > 0 && !is.null(add_legend) && !identical(add_legend, FALSE)) { # Plot legend. text <- vector() for (i in 1:length(legend_text$col)) { effect_label <- if (length(legend_text$cs_index) >= i) legend_text$cs_index[i] else i if (legend_text$size[i] == 1) { text[i] <- paste0("L", effect_label, ": C=1") } else { text[i] <- paste0( "L", effect_label, ": C=", legend_text$size[i], "/R=", legend_text$purity[i] ) } } if (!(add_legend %in% c( "bottomright", "bottom", "bottomleft", "left", "topleft", "top", "topright", "right", "center" ))) { add_legend <- "topright" } legend(add_legend, text, bty = "n", col = legend_text$col, cex = 0.65, pch = 15 ) } } points(pos[b != 0] + start, p[b != 0] + start, col = 2, pch = 16) # options(scipen = scipen0) return(invisible()) } #' @rdname susie_plots #' #' @param L An integer specifying the number of credible sets to plot. #' #' @param file_prefix Prefix to path of output plot file. If not #' specified, the plot, or plots, will be saved to a temporary #' directory generated using \code{\link{tempdir}}. #' #' @param pos Indices of variables to plot. If \code{pos = NULL} all #' variables are plotted. 
#'
#' @examples
#' set.seed(1)
#' n <- 1000
#' p <- 1000
#' beta <- rep(0, p)
#' beta[sample(1:1000, 4)] <- 1
#' X <- matrix(rnorm(n * p), nrow = n, ncol = p)
#' X <- scale(X, center = TRUE, scale = TRUE)
#' y <- drop(X %*% beta + rnorm(n))
#' res <- susie(X, y, L = 10)
#' susie_plot_iteration(res, L = 10)
#'
#' @importFrom grDevices pdf
#' @importFrom grDevices dev.off
#' @importFrom reshape melt
#' @importFrom ggplot2 ggplot
#' @importFrom ggplot2 aes
#' @importFrom ggplot2 geom_col
#' @importFrom ggplot2 ggtitle
#' @importFrom ggplot2 theme_classic
#' @importFrom ggplot2 .data
#'
#' @export
#'
susie_plot_iteration <- function(model, L, file_prefix, pos = NULL) {
  # One stacked-bar panel of alpha values for the first k effects,
  # labeled with the iteration number idx.
  get_layer <- function(obj, k, idx, vars) {
    alpha <- melt(obj$alpha[1:k, vars, drop = FALSE])
    colnames(alpha) <- c("L", "variables", "alpha")
    alpha$L <- as.factor(alpha$L)
    ggplot(alpha, aes(x = .data$variables, y = .data$alpha, group = .data$L)) +
      geom_col(aes(fill = .data$L)) +
      ggtitle(paste("Iteration", idx)) +
      theme_classic()
  }
  k <- min(nrow(model$alpha), L)
  if (is.null(pos)) {
    vars <- 1:ncol(model$alpha)
  } else {
    vars <- pos
  }
  if (missing(file_prefix)) {
    file_prefix <- file.path(tempdir(), "susie_plot")
  }
  pdf(paste0(file_prefix, ".pdf"), 8, 3)
  # With track_fit = TRUE the model carries a trace of per-iteration
  # states; otherwise only the final state is plotted.
  if (is.null(model$trace)) {
    print(get_layer(model, k, model$niter, vars))
  } else {
    for (i in 2:length(model$trace)) {
      print(get_layer(model$trace[[i]], k, i - 1, vars))
    }
  }
  dev.off()
  format <- ".pdf"
  if (!is.null(model$trace)) {
    # Assemble the per-iteration pages into a GIF via ImageMagick's
    # external `convert` command.
    cmd <- paste(
      "convert -delay 30 -loop 0 -density 300 -dispose previous",
      paste0(file_prefix, ".pdf"),
      "\\( -clone 0 -set delay 300 \\) -swap 0 +delete",
      "\\( +clone -set delay 300 \\) +swap +delete -coalesce",
      "-layers optimize",
      paste0(file_prefix, ".gif")
    )
    message("Creating GIF animation...")
    if (file.exists(paste0(file_prefix, ".gif"))) {
      file.remove(paste0(file_prefix, ".gif"))
    }
    output <- try(system(cmd))
    if (inherits(output, "try-error")) {
      stop("Cannot create GIF animation because convert command failed")
    } else {
      format <-
".gif" } } message(paste0("Iterplot saved to ", file_prefix, format, "\n")) return(invisible()) } #' @title Plot changepoint data and susie fit using ggplot2 #' #' @description Plots original data, y, overlaid with line showing #' susie fitted value and shaded rectangles showing credible sets for #' changepoint locations. #' #' @param y An n-vector of observations that are ordered in time or #' space (assumed equally-spaced). #' #' @param s A susie fit generated by #' \code{susie_trendfilter(y,order = 0)}. #' #' @param line_col Color for the line showing fitted values. #' #' @param line_size Size of the lines showing fitted values #' #' @param cs_col Color of the shaded rectangles showing credible #' sets. #' #' @return A ggplot2 plot object. #' #' @examples #' set.seed(1) #' mu <- c(rep(0, 50), rep(1, 50), rep(3, 50), rep(-2, 50), rep(0, 300)) #' y <- mu + rnorm(500) #' # Here we use a less sensitive tolerance so that the example takes #' # less time; in practice you will likely want to use a more stringent #' # setting such as tol = 0.001. #' s <- susie_trendfilter(y, tol = 0.1) #' #' # Produces ggplot with credible sets for changepoints. 
#' susie_plot_changepoint(s, y)
#'
#' @importFrom ggplot2 ggplot
#' @importFrom ggplot2 aes
#' @importFrom ggplot2 geom_point
#' @importFrom ggplot2 geom_line
#' @importFrom ggplot2 annotate
#' @importFrom ggplot2 .data
#'
#' @export
#'
susie_plot_changepoint <- function(s, y, line_col = "blue", line_size = 1.5,
                                   cs_col = "red") {
  # seq_along() (rather than 1:length(y)) behaves correctly when y is
  # empty, producing a zero-row data frame instead of indices c(1, 0).
  df <- data.frame(x = seq_along(y), y = y, mu = predict.susie(s))
  CS <- susie_get_cs(s)$cs
  p <- ggplot(df) +
    geom_point(data = df, aes(x = .data$x, y = .data$y)) +
    geom_line(
      color = line_col,
      data = df,
      aes(x = .data$x, y = .data$mu),
      linewidth = line_size
    )
  # One translucent rectangle per credible set, spanning the CS's variable
  # index range; seq_along(NULL) is empty, so a fit with no credible sets
  # simply skips this loop.
  for (i in seq_along(CS)) {
    p <- p + annotate("rect",
      fill = cs_col, alpha = 0.5,
      xmin = min(CS[[i]]) - 0.5, xmax = max(CS[[i]]) + 0.5,
      ymin = -Inf, ymax = Inf
    )
  }
  return(p)
}


================================================
FILE: R/susie_post_outcome_configuration.R
================================================

# Post-hoc causal-configuration probabilities for one or more SuSiE-class fits.
#
# Two algorithms live here, exposed through one entry point:
#
# * SuSiEx (Nature Genetics, 2024): N-trait 2^N enumeration. Per CS tuple
#   (one CS chosen from each trait), report posterior probabilities over
#   all 2^N "which traits share the causal" patterns plus per-trait
#   marginals. Legacy reference implementation:
#   `mvf.susie.alpha::posthoc_multfsusie`.
#
# * Coloc pairwise ABF (Wallace, 2020 / `coloc::coloc.bf_bf`): pairwise
#   H0/H1/H2/H3/H4 posteriors for every (trait, trait') pair across every
#   (CS in trait, CS in trait') pair. Implemented inline here as a
#   verbatim port of `coloc:::combine.abf` so susieR has no soft
#   dependency on coloc.
#
# The public function normalises any supported input shape (single fit, list
# of fits, or a single multi-output fit treated outcome-wise) to a flat list
# of "trait views", then runs the requested algorithms against that list.
# Class-aware branches use `inherits()` and are confined to one helper.
# # The return value is tagged with class `"susie_post_outcome_configuration"` # so `summary()` dispatches to the pretty-printer at the bottom of this file. #' Post-hoc causal-configuration probabilities for one or more SuSiE-class fits #' #' Runs one of two complementary post-hoc analyses, selected by #' \code{method}: \code{"susiex"} (default) for the SuSiEx \eqn{2^N} #' combinatorial enumeration, reporting the posterior probability of #' every binary causality pattern across the \eqn{N} input traits; or #' \code{"coloc_pairwise"} for the coloc pairwise ABF, reporting the #' five colocalisation hypothesis posteriors (H0/H1/H2/H3/H4) for every #' pair of traits. To get both, call the function twice and combine. #' #' Two grouping modes are supported through the \code{by} argument: #' \describe{ #' \item{\code{"fit"}}{Each input fit contributes a single trait view. #' Multi-output fits (\code{mvsusie}, \code{mfsusie}) are kept whole: the #' trait's per-(CS, SNP) log Bayes factors are the joint composite #' stored on the fit as \code{lbf_variable}. Configuration enumeration #' loops over the cross-product \eqn{L_1 \times \dots \times L_N} of CS #' indices.} #' \item{\code{"outcome"}}{Multi-output fits fan out into per-outcome views, #' each with its own per-(CS, SNP) log Bayes factors read from #' \code{fit$lbf_variable_outcome} (an \eqn{L \times J \times R} or #' \eqn{L \times J \times M} array). All per-outcome views share the #' joint fit's PIP matrix and CS list, so the configuration enumeration #' reduces to a single index \eqn{l \in 1..L}. Single-output \code{susie} #' fits pass through unchanged. 
Requires \code{$lbf_variable_outcome} on the #' fit (set \code{attach_lbf_variable_outcome = TRUE} when fitting).} #' } #' #' \subsection{SuSiEx algorithm}{ #' For each credible-set tuple \eqn{(l_1, \dots, l_N)}: #' \enumerate{ #' \item Per-trait CS-level log BF (alpha-weighted SNP average): #' \deqn{\log\mathrm{BF}^{(n)}_{l_n} = \sum_j \alpha_{n,l_n,j}\, #' \log\mathrm{BF}_{n,l_n,j}.} #' \item Enumerate the \eqn{2^N} binary configurations #' \eqn{c \in \{0,1\}^N}. #' \item Configuration log BF: #' \deqn{\log\mathrm{BF}^{(c)} = \sum_{n: c_n = 1} \log\mathrm{BF}^{(n)}_{l_n}.} #' \item Normalise under a uniform prior over the \eqn{2^N} configurations. #' \item Per-trait marginal: \eqn{P(\mathrm{trait}\,n\,\mathrm{causal}) = #' \sum_{c: c_n = 1} P(c \mid \mathrm{tuple})}. #' } #' } #' #' \subsection{Coloc pairwise algorithm}{ #' For each unordered trait pair \eqn{(n, n')} and each CS pair #' \eqn{(l_n, l_{n'})}, with per-SNP log BFs #' \eqn{\ell_1 = \log\mathrm{BF}_{n,l_n,\cdot}} and #' \eqn{\ell_2 = \log\mathrm{BF}_{n',l_{n'},\cdot}} (length \eqn{J}), the #' five hypothesis log-BFs are #' \deqn{\log\mathrm{BF}_{H_0} = 0,\quad #' \log\mathrm{BF}_{H_1} = \log p_1 + \mathrm{LSE}(\ell_1),\quad #' \log\mathrm{BF}_{H_2} = \log p_2 + \mathrm{LSE}(\ell_2),} #' \deqn{\log\mathrm{BF}_{H_3} = \log p_1 + \log p_2 + #' \mathrm{logdiff}(\mathrm{LSE}(\ell_1) + \mathrm{LSE}(\ell_2),\; #' \mathrm{LSE}(\ell_1 + \ell_2)),} #' \deqn{\log\mathrm{BF}_{H_4} = \log p_{12} + \mathrm{LSE}(\ell_1 + \ell_2),} #' and the corresponding posteriors are #' \eqn{\mathrm{PP.H}_h = \exp(\log\mathrm{BF}_{H_h} - #' \mathrm{LSE}(\log\mathrm{BF}_{H_0:H_4}))}, where #' \eqn{\mathrm{LSE}} is the log-sum-exp. #' \itemize{ #' \item H0: no causal variant in either CS. #' \item H1: causal in trait \eqn{n} only. #' \item H2: causal in trait \eqn{n'} only. #' \item H3: distinct causals in the two traits. #' \item H4: a single shared causal variant. 
#' } #' } #' #' @param input A single fit of class \code{susie}, \code{mvsusie}, or #' \code{mfsusie}, OR a list of such fits. #' @param by Either \code{"fit"} (one trait per input fit; default) or #' \code{"outcome"} (multi-output fits expand into per-outcome traits). #' @param method Character scalar; one of \code{"susiex"} (default) or #' \code{"coloc_pairwise"}. Pick the analysis to run; for both, call #' the function twice. #' @param prob_thresh Per-trait marginal threshold for the convenience #' \code{$active} flags in the SuSiEx output. Default \code{0.8}. #' @param cs_only Logical. If \code{TRUE} (default) only enumerate over CSs #' present in each fit's \code{$sets$cs}; if \code{FALSE} loop over all L #' rows of \code{$alpha}. Either way, effects whose entire alpha row is #' zero are skipped. When \code{TRUE}, every fit must carry a non-null #' \code{$sets$cs} or the function errors. #' @param p1,p2,p12 Coloc per-SNP causal priors: \code{p1} for trait 1 #' alone, \code{p2} for trait 2 alone, \code{p12} for shared causal. #' Defaults match \code{coloc::coloc.bf_bf}: \code{p1 = p2 = 1e-4}, #' \code{p12 = 5e-6}. Only used when \code{"coloc_pairwise"} is in #' \code{methods}. #' @param ... Currently ignored. #' #' @return A list of class \code{"susie_post_outcome_configuration"} with #' exactly one of the following components, depending on \code{method}: #' \describe{ #' \item{\code{$susiex}}{(when \code{method = "susiex"}) A list of length #' equal to the number of CS tuples considered. 
Each element has
#' components \code{cs_indices} (length-N integer tuple),
#' \code{logBF_trait} (length N), \code{configs} (\eqn{2^N \times N}
#' binary matrix), \code{config_prob} (length \eqn{2^N}),
#' \code{marginal_prob} (length-N per-trait marginal posterior
#' probability of being active across the configuration ensemble),
#' and \code{active} (logical, \code{marginal_prob >= prob_thresh}).}
#' \item{\code{$coloc_pairwise}}{(when \code{method = "coloc_pairwise"})
#' A data.frame with one row per (trait1, trait2, l1, l2)
#' combination, columns \code{trait1, trait2, l1, l2, hit1, hit2,
#' PP.H0, PP.H1, PP.H2, PP.H3, PP.H4}.}
#' }
#' Pretty-print with \code{summary(out)}.
#'
#' @references
#' SuSiEx, Nature Genetics 2024 (combinatorial \eqn{2^N} enumeration).
#' Wallace, PLoS Genetics 2020 (coloc pairwise H0/H1/H2/H3/H4 ABF).
#'
#' @export
susie_post_outcome_configuration <- function(input,
                                             by = c("fit", "outcome"),
                                             method = c("susiex", "coloc_pairwise"),
                                             prob_thresh = 0.8,
                                             cs_only = TRUE,
                                             p1 = 1e-4, p2 = 1e-4, p12 = 5e-6,
                                             ...)
{
  by <- match.arg(by)
  method <- match.arg(method)
  # Scalar-argument validation up front so downstream helpers can assume
  # well-formed inputs.
  if (!is.numeric(prob_thresh) || length(prob_thresh) != 1L ||
      !is.finite(prob_thresh) || prob_thresh < 0 || prob_thresh > 1) {
    stop("`prob_thresh` must be a single numeric in [0, 1].")
  }
  if (!is.logical(cs_only) || length(cs_only) != 1L || is.na(cs_only)) {
    stop("`cs_only` must be a single logical (TRUE or FALSE).")
  }
  # Validate the three coloc priors with one loop; get(nm) reads the local
  # argument named nm from this function's frame.
  for (nm in c("p1", "p2", "p12")) {
    v <- get(nm)
    if (!is.numeric(v) || length(v) != 1L || !is.finite(v) ||
        v <= 0 || v >= 1) {
      stop("`", nm, "` must be a single numeric in (0, 1).")
    }
  }
  # Flatten the input (fit / list of fits / multi-output fit) into a list
  # of per-trait views, then dispatch on the selected algorithm.
  views <- normalise_to_views(input, by = by, cs_only = cs_only)
  out <- list()
  if (identical(method, "susiex")) {
    out$susiex <- susiex_configurations(views, by = by,
                                        prob_thresh = prob_thresh)
  } else { # method == "coloc_pairwise"
    out$coloc_pairwise <- coloc_pairwise_abf(views, p1 = p1, p2 = p2,
                                             p12 = p12)
  }
  # Echo parameters as attributes for the summary/print methods.
  attr(out, "prob_thresh") <- prob_thresh
  attr(out, "method") <- method
  class(out) <- c("susie_post_outcome_configuration", "list")
  out
}

# -----------------------------------------------------------------------------
# Input normalisation
# -----------------------------------------------------------------------------

# TRUE when x carries any of the three supported SuSiE-family classes.
is_susie_fit <- function(x) {
  inherits(x, "susie") || inherits(x, "mvsusie") || inherits(x, "mfsusie")
}

# Validate the raw `input` and flatten it to a list of trait views.
# A bare fit is wrapped in a one-element list first; every element must be
# a SuSiE-class fit, and under cs_only = TRUE every fit must carry a CS list.
normalise_to_views <- function(input, by, cs_only) {
  fits <- if (is_susie_fit(input)) list(input) else as.list(input)
  if (length(fits) == 0L) {
    stop("`input` must be a SuSiE-class fit or a non-empty list of fits.")
  }
  for (k in seq_along(fits)) {
    if (!is_susie_fit(fits[[k]])) {
      stop("Element ", k,
           " of `input` is not a SuSiE-class fit (`susie`, `mvsusie`, or ",
           "`mfsusie`).")
    }
    if (cs_only && is.null(fits[[k]]$sets$cs)) {
      stop("Fit ", k, ": `cs_only = TRUE` requires `$sets$cs` to be present. ",
           "Either pass `cs_only = FALSE` or attach a credible-set list via ",
           "susie_get_cs() before calling.")
    }
  }
  # Name unnamed / blank-named fits "trait_1", "trait_2", ... so every view
  # carries a usable label.
  raw_names <- names(fits)
  if (is.null(raw_names)) raw_names <- character(length(fits))
  default_names <- paste0("trait_", seq_along(fits))
  raw_names[!nzchar(raw_names)] <- default_names[!nzchar(raw_names)]
  views <- vector("list", 0)
  for (k in seq_along(fits)) {
    views <- c(views, expand_one_fit(fits[[k]], raw_names[k], by = by))
  }
  views
}

# Turn one fit into one or more trait views. Under by = "fit" every fit is
# a single view using its joint composite lbf_variable. Under by = "outcome"
# a multi-output fit fans out into one view per slice of the third dimension
# of $lbf_variable_outcome; all such views share the joint alpha and CS list.
expand_one_fit <- function(fit, base_name, by) {
  if (by == "fit") {
    return(list(make_view(
      name = base_name,
      alpha = fit$alpha,
      lbf = fit$lbf_variable,
      sets_cs = fit$sets$cs
    )))
  }
  # by = "outcome": multi-output fits fan out; single-output fits pass
  # through as one view.
  if (inherits(fit, "mvsusie") || inherits(fit, "mfsusie")) {
    if (is.null(fit$lbf_variable_outcome)) {
      stop("Fit '", base_name,
           "': `by = \"outcome\"` requires `$lbf_variable_outcome` ",
           "(an L x J x R or L x J x M array) on the fit. ",
           "Refit with `attach_lbf_variable_outcome = TRUE` (the default in mfsusie / ",
           "mvsusie), or pass `by = \"fit\"` to use the joint composite log ",
           "BF instead.")
    }
    R <- dim(fit$lbf_variable_outcome)[3L]
    out_names <- dimnames(fit$lbf_variable_outcome)[[3L]]
    if (is.null(out_names)) out_names <- paste0("outcome_", seq_len(R))
    views <- vector("list", R)
    for (r in seq_len(R)) {
      views[[r]] <- make_view(
        name = paste0(base_name, "_", out_names[r]),
        alpha = fit$alpha,
        lbf = fit$lbf_variable_outcome[, , r, drop = TRUE],
        sets_cs = fit$sets$cs
      )
    }
    return(views)
  }
  # Single-output `susie` under by = "outcome": same as by = "fit".
  list(make_view(
    name = base_name,
    alpha = fit$alpha,
    lbf = fit$lbf_variable,
    sets_cs = fit$sets$cs
  ))
}

# Assemble and validate a single trait view: a plain list holding the
# trait label, the L x J alpha and log-BF matrices (coerced to matrix and
# required to have identical shape), and the fit's CS list.
make_view <- function(name, alpha, lbf, sets_cs) {
  if (is.null(alpha) || is.null(lbf)) {
    stop("Trait '", name, "': both `$alpha` and `$lbf_variable` (or per-",
         "outcome lbf row) must be non-null.")
  }
  if (!is.matrix(alpha)) alpha <- as.matrix(alpha)
  if (!is.matrix(lbf)) lbf <- as.matrix(lbf)
  if (!identical(dim(alpha), dim(lbf))) {
    stop("Trait '", name, "': `alpha` and `lbf` must have identical shape; ",
         "got ", paste(dim(alpha), collapse = "x"), " vs ",
         paste(dim(lbf), collapse = "x"), ".")
  }
  list(name = name, alpha = alpha, lbf = lbf, sets_cs = sets_cs)
}

# -----------------------------------------------------------------------------
# CS-tuple enumeration shared by both algorithms.
# -----------------------------------------------------------------------------

# Per-view CS index set, restricted to $sets$cs when cs_only = TRUE.
view_cs_indices <- function(view, cs_only) {
  L_n <- nrow(view$alpha)
  if (!cs_only) return(seq_len(L_n))
  idx <- attr(view$sets_cs, "cs_idx")
  if (is.null(idx)) {
    # Fall back to the names of $sets$cs ("L1", "L2", ... in susieR's format).
    # NOTE(review): non-numeric CS names would coerce to NA here and leak
    # NA indices through the range filter below -- TODO confirm all callers
    # use susieR-style "L<k>" names.
    if (length(view$sets_cs) > 0L && !is.null(names(view$sets_cs))) {
      idx <- as.integer(sub("^L", "", names(view$sets_cs)))
    } else {
      idx <- seq_len(L_n)
    }
  }
  # Drop indices that fall outside the L rows of alpha.
  idx[idx >= 1L & idx <= L_n]
}

# Returns a list of length-N integer tuples (one CS index per view).
# Under by = "outcome" all views share CSs and we use the diagonal.
# Under by = "fit" we use the cross-product.
# Enumerate the CS tuples visited by the algorithms: the cross-product of
# the per-view CS index sets under by = "fit", or the shared (diagonal)
# indices under by = "outcome". Returns an empty list when any view has no
# usable CS indices.
enumerate_cs_tuples <- function(views, by, cs_only) {
  per_view <- lapply(views, view_cs_indices, cs_only = cs_only)
  if (any(vapply(per_view, length, integer(1)) == 0L)) return(list())
  if (by == "outcome") {
    # All views share the same CS list, so only matched indices make sense.
    common <- Reduce(intersect, per_view)
    lapply(common, function(l) rep.int(l, length(views)))
  } else {
    grid <- expand.grid(per_view, KEEP.OUT.ATTRS = FALSE)
    lapply(seq_len(nrow(grid)), function(i) as.integer(grid[i, , drop = TRUE]))
  }
}

# -----------------------------------------------------------------------------
# SuSiEx 2^N configuration enumeration.
# -----------------------------------------------------------------------------

# For each CS tuple, compute the per-trait CS-level log BF (alpha-weighted
# SNP average), enumerate all 2^N binary causality configurations, and
# normalise their BFs under a uniform prior. Tuples containing an all-zero
# alpha row are skipped. `max_traits` caps N so 2^N stays tractable.
susiex_configurations <- function(views, by, prob_thresh, max_traits = 20L) {
  N <- length(views)
  if (N > max_traits) {
    stop("susiex: N = ", N, " traits exceeds the safety ceiling (", max_traits,
         "); 2^N enumeration would be too large.")
  }
  cs_tuples <- enumerate_cs_tuples(views, by = by, cs_only = TRUE)
  if (length(cs_tuples) == 0L) return(list())
  # 2^N x N binary matrix; expand.grid orders rows with the first trait
  # varying fastest.
  configs <- as.matrix(expand.grid(rep(list(c(0L, 1L)), N)))
  colnames(configs) <- paste0("trait_", seq_len(N))
  trait_names <- vapply(views, function(v) v$name, character(1))
  out <- vector("list", length(cs_tuples))
  for (ti in seq_along(cs_tuples)) {
    tuple <- cs_tuples[[ti]]
    logBF_trait <- numeric(N)
    skip <- FALSE
    for (n in seq_len(N)) {
      l_n <- tuple[n]
      alpha_row <- views[[n]]$alpha[l_n, ]
      lbf_row <- views[[n]]$lbf[l_n, ]
      if (all(alpha_row == 0)) { skip <- TRUE; break }
      logBF_trait[n] <- sum(alpha_row * lbf_row) # alpha-weighted SNP avg
    }
    # Leave the slot NULL and move on; it is filtered out below. (Do NOT
    # assign `out[[ti]] <- NULL` here: in R that *removes* the element,
    # shrinking the list and misaligning all later `ti` indices.)
    if (skip) next
    # Configuration log BF for every binary pattern, then a stable
    # softmax-style normalisation under the uniform configuration prior.
    logBF_conf <- as.vector(configs %*% logBF_trait)
    maxlog <- max(logBF_conf)
    prob_conf <- exp(logBF_conf - maxlog)
    prob_conf <- prob_conf / sum(prob_conf)
    # Per-trait marginal: sum of config probabilities where that trait is 1.
    marginal_prob <- as.vector(crossprod(configs, prob_conf))
    out[[ti]] <- list(
      cs_indices = setNames(as.integer(tuple), trait_names),
      logBF_trait = setNames(logBF_trait, trait_names),
      configs = configs,
      config_prob = prob_conf,
      marginal_prob = setNames(marginal_prob, trait_names),
      active = setNames(marginal_prob >= prob_thresh, trait_names)
    )
  }
  out[!vapply(out, is.null, logical(1))]
}

# -----------------------------------------------------------------------------
# Coloc pairwise ABF (verbatim port of coloc:::combine.abf).
# -----------------------------------------------------------------------------

# Numerically stable log(sum(exp(x))).
.logsum <- function(x) {
  m <- max(x)
  m + log(sum(exp(x - m)))
}

# Numerically stable log(exp(a) - exp(b)) for a > b.
.logdiff <- function(a, b) {
  m <- max(a, b)
  m + log(exp(a - m) - exp(b - m))
}

# Compute (PP.H0, PP.H1, PP.H2, PP.H3, PP.H4) from per-SNP log-BF vectors,
# matching coloc:::combine.abf line-for-line.
combine_abf_pair <- function(l1, l2, p1, p2, p12) {
  stopifnot(length(l1) == length(l2))
  lsum <- l1 + l2
  lH0 <- 0
  lH1 <- log(p1) + .logsum(l1)
  lH2 <- log(p2) + .logsum(l2)
  lH3 <- log(p1) + log(p2) +
    .logdiff(.logsum(l1) + .logsum(l2), .logsum(lsum))
  lH4 <- log(p12) + .logsum(lsum)
  all_lH <- c(lH0, lH1, lH2, lH3, lH4)
  pp <- exp(all_lH - .logsum(all_lH))
  names(pp) <- paste0("PP.H", 0:4)
  pp
}

# Run combine_abf_pair for every unordered trait pair and every CS pair,
# returning one data.frame row per (trait1, trait2, l1, l2). `hit1`/`hit2`
# are the top-log-BF SNP labels (column names when present, otherwise
# "snp_<j>"). CS rows with an all-zero alpha are skipped.
coloc_pairwise_abf <- function(views, p1, p2, p12) {
  N <- length(views)
  empty <- data.frame(trait1 = character(0), trait2 = character(0),
                      l1 = integer(0), l2 = integer(0),
                      hit1 = character(0), hit2 = character(0),
                      PP.H0 = numeric(0), PP.H1 = numeric(0),
                      PP.H2 = numeric(0), PP.H3 = numeric(0),
                      PP.H4 = numeric(0), stringsAsFactors = FALSE)
  if (N < 2L) return(empty)
  trait_names <- vapply(views, function(v) v$name, character(1))
  rows <- list()
  for (a in seq_len(N - 1L)) {
    for (b in (a + 1L):N) {
      L1 <- view_cs_indices(views[[a]], cs_only = TRUE)
      L2 <- view_cs_indices(views[[b]], cs_only = TRUE)
      if (length(L1) == 0L || length(L2) == 0L) next
      var_names_a <- colnames(views[[a]]$lbf)
      var_names_b <- colnames(views[[b]]$lbf)
      for (i in L1) {
        if (all(views[[a]]$alpha[i, ] == 0)) next
        l1_row <- views[[a]]$lbf[i, ]
        for (j in L2) {
          if (all(views[[b]]$alpha[j, ] == 0)) next
          l2_row <- views[[b]]$lbf[j, ]
          pp <- combine_abf_pair(l1_row, l2_row, p1 = p1, p2 = p2, p12 = p12)
          hit1 <- if (!is.null(var_names_a)) {
            var_names_a[which.max(l1_row)]
          } else {
            paste0("snp_", which.max(l1_row))
          }
          hit2 <- if (!is.null(var_names_b)) {
            var_names_b[which.max(l2_row)]
          } else {
            paste0("snp_", which.max(l2_row))
          }
          rows[[length(rows) + 1L]] <- data.frame(
            trait1 = trait_names[a], trait2 = trait_names[b],
            l1 = i, l2 = j, hit1 = hit1, hit2 = hit2,
            PP.H0 = pp["PP.H0"], PP.H1 = pp["PP.H1"], PP.H2 = pp["PP.H2"],
            PP.H3 = pp["PP.H3"], PP.H4 = pp["PP.H4"],
            stringsAsFactors = FALSE, row.names = NULL
          )
        }
      }
    }
  }
  if (length(rows) == 0L) return(empty)
  do.call(rbind, rows)
}

# =============================================================================
# Summary / print methods for `susie_post_outcome_configuration` results.
# =============================================================================
#
# Goals:
#   * Be the one-stop pretty-printer so users almost never have to inspect
#     the raw nested list.
#   * Color-code signal vs. no-signal so the eye reads the table at a glance
#     (BOLD DARK GREEN = active / shared, YELLOW = ambiguous, DIM = below
#     threshold; coloc verdicts H4 = green/bold, H3 = magenta, H1/H2 = blue,
#     H0 = dim).
#   * Filter no-signal rows by default (signal_only = TRUE) and footer the
#     hidden count.
#   * Be robust to malformed / partial input objects: missing fields,
#     missing columns, empty lists, length-mismatched per-trait fields,
#     trait names colliding with reserved column names, etc. None of these
#     should error -- they should degrade gracefully.

# Reserved column names that the SuSiEx tidy table adds. Trait names that
# collide get a "trait_" prefix during materialisation.
.SUSIEX_RESERVED <- c("tuple", "top_pattern", "top_prob")

# Coloc PP columns. We tolerate the data.frame missing some, only enforce
# that PP.H0..PP.H4 are present (the source enforces all five).
.COLOC_PP_COLS <- c("PP.H0", "PP.H1", "PP.H2", "PP.H3", "PP.H4")
# Optional descriptive columns shown before the PP columns when present.
.COLOC_DISPLAY <- c("trait1", "trait2", "l1", "l2", "hit1", "hit2")
# Human-readable verdict labels, indexed by the dominant hypothesis (1..5).
.COLOC_LABELS <- c("H0 no signal", "H1 trait1-only", "H2 trait2-only",
                   "H3 distinct", "H4 shared")

#' Summarise a susie_post_outcome_configuration result
#'
#' Builds tidy tables from the nested list returned by
#' [susie_post_outcome_configuration()] and prints them with ANSI color
#' highlighting via [print.summary.susie_post_outcome_configuration()].
#' The summary itself is an S3 object: index `$susiex` and
#' `$coloc_pairwise` to grab the data.frames for downstream use.
#'
#' Color encoding (when ANSI colors are available):
#' \itemize{
#'   \item SuSiEx per-trait marginal probability: bold dark green when
#'     `>= prob_thresh` (active), yellow when in
#'     `[ambiguous_lower, prob_thresh)`, dim otherwise. The `active`
#'     logical from the raw result is encoded by color and is not shown
#'     as a separate column.
#'   \item Coloc verdict: bold dark green for H4 (shared causal), magenta
#'     for H3 (distinct causals), blue for H1 or H2 (single-trait causal),
#'     dim for H0 (no signal). The dominant PP per row is bolded.
#' }
#'
#' Robustness: this method is defensive against malformed input. Empty
#' lists, NULL components, missing fields, length-mismatched per-trait
#' vectors, trait names that collide with reserved columns
#' (`tuple`, `top_pattern`, `top_prob`), and coloc data.frames that
#' lack some optional columns (`hit1`, `hit2`) all degrade gracefully
#' rather than erroring.
#'
#' @param object Output of [susie_post_outcome_configuration()].
#' @param prob_thresh Threshold at or above which `marginal_prob` counts
#'   as a signal (default `0.8`).
#' @param ambiguous_lower Lower edge of the "ambiguous" band for the
#'   SuSiEx color coding: marginals in
#'   `[ambiguous_lower, prob_thresh)` are colored yellow. Default `0.5`.
#'   Set to `prob_thresh` to disable the band.
#' @param signal_only Logical. If `TRUE` (default), drop CS tuples where
#'   no trait is active and drop coloc rows whose dominant hypothesis is
#'   H0. Pass `FALSE` to keep everything.
#' @param color One of `"auto"` (default; honors [crayon::has_color()]),
#'   `TRUE` (force colors on), or `FALSE` (force them off).
#' @param ... Ignored.
#'
#' @return A list of class `"summary.susie_post_outcome_configuration"`
#'   with components:
#' \describe{
#'   \item{`$susiex`}{`data.frame` (or `NULL` when no signals): one row per
#'     CS tuple. Columns: `tuple` (e.g. `"(1,1,1)"`), one numeric column
#'     per trait carrying that trait's `marginal_prob`, `top_pattern`
#'     (binary configuration string for the most-probable configuration),
#'     `top_prob` (its probability).}
#'   \item{`$coloc_pairwise`}{`data.frame` (or `NULL`): the original coloc
#'     table extended with `verdict` (named hypothesis label) and `top_pp`
#'     (the dominant PP value).}
#'   \item{`$susiex_n_total`, `$susiex_n_kept`, `$coloc_n_total`,
#'     `$coloc_n_kept`}{row counts before and after `signal_only`
#'     filtering, used by the print method to footer hidden rows.}
#'   \item{`$prob_thresh`, `$ambiguous_lower`, `$signal_only`, `$color`}{
#'     parameters echoed for the print method.}
#' }
#'
#' @seealso [susie_post_outcome_configuration()],
#'   [print.summary.susie_post_outcome_configuration()]
#'
#' @method summary susie_post_outcome_configuration
#' @export summary.susie_post_outcome_configuration
#' @export
summary.susie_post_outcome_configuration <- function(
    object, prob_thresh = 0.8, ambiguous_lower = 0.5, signal_only = TRUE,
    color = "auto", ...)
{
  # Argument validation mirrors susie_post_outcome_configuration().
  if (!is.numeric(prob_thresh) || length(prob_thresh) != 1L ||
      !is.finite(prob_thresh) || prob_thresh < 0 || prob_thresh > 1) {
    stop("`prob_thresh` must be a single numeric in [0, 1].")
  }
  if (!is.numeric(ambiguous_lower) || length(ambiguous_lower) != 1L ||
      !is.finite(ambiguous_lower) || ambiguous_lower < 0 ||
      ambiguous_lower > prob_thresh) {
    stop("`ambiguous_lower` must be a single numeric in [0, prob_thresh].")
  }
  if (!is.logical(signal_only) || length(signal_only) != 1L ||
      is.na(signal_only)) {
    stop("`signal_only` must be a single logical (TRUE or FALSE).")
  }
  if (!(isTRUE(color) || isFALSE(color) || identical(color, "auto"))) {
    stop("`color` must be one of TRUE, FALSE, or \"auto\".")
  }
  # Build the two tidy tables (either may be NULL when absent or fully
  # filtered), then bundle them with the echoed display parameters.
  ses <- .summarise_susiex(object$susiex, signal_only, prob_thresh)
  cls <- .summarise_coloc(object$coloc_pairwise, signal_only)
  out <- list(
    susiex = ses$df,
    susiex_n_total = ses$n_total,
    susiex_n_kept = ses$n_kept,
    coloc_pairwise = cls$df,
    coloc_n_total = cls$n_total,
    coloc_n_kept = cls$n_kept,
    prob_thresh = prob_thresh,
    ambiguous_lower = ambiguous_lower,
    signal_only = signal_only,
    color = color
  )
  class(out) <- c("summary.susie_post_outcome_configuration", "list")
  out
}

# Tidy `configs$susiex` (list of CS-tuple result lists) into a data.frame
# wrapped in a small list with kept/total counts so the print method can
# tell users what was hidden. Returns NULL `df` when input is empty or
# fully filtered.
#
# Defensive against per-tuple field omissions: a tuple missing
# `marginal_prob` or `config_prob` is silently skipped. Trait names that
# collide with reserved columns are prefixed with "trait_". Trait sets
# that vary across tuples are unioned.
.summarise_susiex <- function(susiex, signal_only, prob_thresh) {
  if (is.null(susiex) || !is.list(susiex) || length(susiex) == 0L) {
    return(list(df = NULL, n_total = 0L, n_kept = 0L))
  }
  n_total <- length(susiex)
  # Pull the union of trait names across all tuples (some tuples might be
  # malformed and missing fields; we just skip those).
  trait_names_all <- unique(unlist(lapply(susiex, function(tup) {
    if (is.list(tup) && !is.null(tup$marginal_prob)) {
      names(tup$marginal_prob)
    } else character(0)
  })))
  if (length(trait_names_all) == 0L) {
    return(list(df = NULL, n_total = n_total, n_kept = 0L))
  }
  # Avoid collisions with reserved column names by prefixing.
  trait_cols <- ifelse(trait_names_all %in% .SUSIEX_RESERVED,
                       paste0("trait_", trait_names_all),
                       trait_names_all)
  trait_cols <- make.unique(trait_cols)
  names(trait_cols) <- trait_names_all # raw -> column-name mapping
  rows <- lapply(susiex, function(tup) {
    if (!is.list(tup) || is.null(tup$marginal_prob) ||
        is.null(tup$config_prob) || is.null(tup$configs)) {
      return(NULL)
    }
    mp <- tup$marginal_prob
    if (signal_only) {
      # Re-derive active using current prob_thresh (don't trust the stored
      # active flag, which was computed against the call-time threshold).
      if (!any(is.finite(mp) & mp >= prob_thresh)) return(NULL)
    }
    cp <- tup$config_prob
    if (length(cp) == 0L || !all(is.finite(cp))) return(NULL)
    top_idx <- which.max(cp)
    cfg <- tup$configs
    # Most-probable configuration as a binary string, e.g. "101".
    top_pat <- if (is.matrix(cfg) && nrow(cfg) >= top_idx) {
      paste(cfg[top_idx, ], collapse = "")
    } else NA_character_
    cs_idx_str <- if (!is.null(tup$cs_indices)) {
      paste0("(", paste(tup$cs_indices, collapse = ","), ")")
    } else NA_character_
    out <- data.frame(tuple = cs_idx_str, stringsAsFactors = FALSE)
    # One numeric column per trait; NA when this tuple lacks that trait.
    for (raw in trait_names_all) {
      out[[trait_cols[[raw]]]] <- if (raw %in% names(mp)) {
        as.numeric(mp[[raw]])
      } else NA_real_
    }
    out$top_pattern <- top_pat
    out$top_prob <- as.numeric(cp[top_idx])
    out
  })
  rows <- rows[!vapply(rows, is.null, logical(1))]
  if (length(rows) == 0L) {
    return(list(df = NULL, n_total = n_total, n_kept = 0L))
  }
  df <- do.call(rbind, rows)
  rownames(df) <- NULL
  list(df = df, n_total = n_total, n_kept = nrow(df))
}

# Annotate the coloc data.frame with verdict + dominant PP, and optionally
# drop rows whose dominant hypothesis is H0. Returns the df and kept/total
# counts so the print method can footer the hidden count. Tolerates the
# input data.frame already carrying a `verdict` or `top_pp` column (we
# overwrite). Warns and skips the coloc summary if any of PP.H0..PP.H4 is
# missing -- those columns define the algorithm.
.summarise_coloc <- function(df, signal_only) {
  if (is.null(df) || !is.data.frame(df) || nrow(df) == 0L) {
    return(list(df = NULL, n_total = 0L, n_kept = 0L))
  }
  missing_pp <- setdiff(.COLOC_PP_COLS, colnames(df))
  if (length(missing_pp) > 0L) {
    warning("coloc_pairwise table missing required columns: ",
            paste(missing_pp, collapse = ", "),
            "; skipping coloc summary.", call. = FALSE)
    return(list(df = NULL, n_total = nrow(df), n_kept = 0L))
  }
  pp_mat <- as.matrix(df[, .COLOC_PP_COLS, drop = FALSE])
  storage.mode(pp_mat) <- "double"
  # Rows where every PP is NA / non-finite are unscoreable; treat as H0.
  bad_row <- !apply(pp_mat, 1L, function(r) any(is.finite(r)))
  pp_mat[bad_row, ] <- 0
  pp_mat[bad_row, 1L] <- 1
  top <- max.col(pp_mat, ties.method = "first")
  df$verdict <- .COLOC_LABELS[top]
  df$top_pp <- pp_mat[cbind(seq_len(nrow(df)), top)]
  n_total <- nrow(df)
  if (signal_only) {
    # top == 1L means H0 dominates; those rows carry no signal.
    df <- df[top != 1L, , drop = FALSE]
    rownames(df) <- NULL
  }
  if (nrow(df) == 0L) {
    return(list(df = NULL, n_total = n_total, n_kept = 0L))
  }
  list(df = df, n_total = n_total, n_kept = nrow(df))
}

#' Print a summary.susie_post_outcome_configuration object
#'
#' Pretty-prints the tidy tables built by
#' [summary.susie_post_outcome_configuration()] with optional ANSI color
#' highlighting. See that page for the color encoding.
#'
#' @param x Output of [summary.susie_post_outcome_configuration()].
#' @param ... Ignored.
#' @return The input invisibly.
#'
#' @seealso [summary.susie_post_outcome_configuration()]
#'
#' @method print summary.susie_post_outcome_configuration
#' @export print.summary.susie_post_outcome_configuration
#' @export
#' @importFrom crayon has_color bold silver green yellow blue magenta cyan
print.summary.susie_post_outcome_configuration <- function(x, ...) {
  # Colorize when the caller explicitly asked for color, or when color = "auto"
  # and crayon reports the terminal supports ANSI colors.
  use_color <- isTRUE(x$color) || (identical(x$color, "auto") && has_color())
  # Force-enable crayon when the caller asked for colors explicitly. Crayon
  # otherwise respects its own global `crayon.enabled` option and may strip
  # ANSI in non-tty contexts (R CMD CHECK, capture.output, knitr) even when
  # the user passed `color = TRUE`.
  if (isTRUE(x$color)) {
    old_opt <- options(crayon.enabled = TRUE)
    on.exit(options(old_opt), add = TRUE)
  }
  # `paint(s, style)` applies a crayon style only when color is active;
  # otherwise it returns the string unchanged.
  paint <- if (use_color) {
    function(s, style) style(s)
  } else {
    function(s, style) s
  }
  # Neither section present: print a one-line placeholder and return.
  if (is.null(x$susiex) && is.null(x$coloc_pairwise)) {
    cat("susie_post_outcome_configuration: no signals to report",
        if (isTRUE(x$signal_only)) " (signal_only = TRUE)" else "",
        "\n", sep = "")
    return(invisible(x))
  }
  # SuSiEx section: one row per CS tuple, one probability column per trait.
  if (!is.null(x$susiex) && nrow(x$susiex) > 0L) {
    cat("\n",
        paint("SuSiEx: per-trait marginal P(active) per CS tuple", bold),
        "\n", sep = "")
    cat(paint(sprintf(
      " prob_thresh = %.2f, ambiguous = [%.2f, %.2f)",
      x$prob_thresh, x$ambiguous_lower, x$prob_thresh), silver),
      "\n\n", sep = "")
    .print_susiex_table(x$susiex, x$prob_thresh, x$ambiguous_lower, use_color)
    # When signal_only filtering hid rows, tell the user how to see them.
    if (isTRUE(x$signal_only) && x$susiex_n_total > x$susiex_n_kept) {
      cat(paint(sprintf(
        " (%d/%d CS tuples hidden -- no trait above prob_thresh; pass signal_only = FALSE to show)",
        x$susiex_n_total - x$susiex_n_kept, x$susiex_n_total), silver),
        "\n", sep = "")
    }
  }
  # Coloc section: one row per (trait, trait', l1, l2) pair with PP columns.
  if (!is.null(x$coloc_pairwise) && nrow(x$coloc_pairwise) > 0L) {
    cat("\n",
        paint("Coloc pairwise: dominant hypothesis per (trait, trait', l1, l2)", bold),
        "\n", sep = "")
    cat(paint(
      " H0 no signal | H1 trait1-only | H2 trait2-only | H3 distinct | H4 shared",
      silver),
      "\n\n", sep = "")
    .print_coloc_table(x$coloc_pairwise, use_color)
    if (isTRUE(x$signal_only) && x$coloc_n_total > x$coloc_n_kept) {
      cat(paint(sprintf(
        " (%d/%d pairs hidden -- H0 dominant; pass signal_only = FALSE to show)",
        x$coloc_n_total - x$coloc_n_kept, x$coloc_n_total), silver),
        "\n", sep = "")
    }
  }
  invisible(x)
}

# ---- table renderers -------------------------------------------------------

# Render the SuSiEx table: CS tuple id, per-trait probabilities (color-coded
# against prob_thresh / ambiguous_lower), top configuration pattern, top prob.
.print_susiex_table <- function(df, prob_thresh, ambiguous_lower, use_color) {
  # Trait probability columns are everything not in the reserved column set.
  trait_cols <- setdiff(colnames(df), .SUSIEX_RESERVED)
  # Format a probability: green/bold above threshold, yellow in the ambiguous
  # band, silver otherwise; NA rendered dimly.
  fmt_prob <- function(p) {
    s <- if (is.na(p)) " NA" else sprintf("%.3f", p)
    if (!use_color) return(s)
    if (is.na(p)) silver(s) else if (p >= prob_thresh) bold(green(s)) else if (p >= ambiguous_lower) yellow(s) else silver(s)
  }
  # Format the top configuration pattern (cyan when colored).
  fmt_pat <- function(pat) {
    if (is.na(pat)) return("NA")
    if (!use_color) return(pat)
    cyan(pat)
  }
  hdr <- c("CS tuple", trait_cols, "top pattern", "top P")
  rows <- lapply(seq_len(nrow(df)), function(i) {
    c(as.character(df$tuple[i]),
      vapply(trait_cols, function(t) fmt_prob(df[[t]][i]), character(1)),
      fmt_pat(df$top_pattern[i]),
      sprintf("%.3f", df$top_prob[i]))
  })
  .print_aligned(hdr, rows)
}

# Render the pairwise coloc table: display columns, PP columns (per-row max
# bolded), and a color-coded verdict string.
.print_coloc_table <- function(df, use_color) {
  display_present <- intersect(.COLOC_DISPLAY, colnames(df))
  pp_present <- intersect(.COLOC_PP_COLS, colnames(df))
  pp_mat <- as.matrix(df[, pp_present, drop = FALSE])
  storage.mode(pp_mat) <- "double"
  # Index of the dominant hypothesis in each row (first wins on ties).
  top_idx <- max.col(pp_mat, ties.method = "first")
  # Format a posterior probability; the per-row maximum is bolded.
  fmt_pp <- function(p, is_top) {
    s <- if (is.na(p)) " NA" else sprintf("%.3f", p)
    if (!use_color) return(s)
    if (is.na(p)) silver(s) else if (is_top) bold(s) else s
  }
  # Color the verdict by its leading hypothesis label (H0..H4).
  fmt_verdict <- function(v) {
    if (is.na(v) || !nzchar(v)) return(if (is.na(v)) "NA" else v)
    if (!use_color) return(v)
    style <- switch(
      substr(v, 1L, 2L),
      "H0" = silver,
      "H1" = blue,
      "H2" = blue,
      "H3" = magenta,
      "H4" = function(s) bold(green(s)),
      identity)
    style(v)
  }
  hdr <- c(display_present, pp_present, "verdict")
  rows <- lapply(seq_len(nrow(df)), function(i) {
    pp_strs <- vapply(seq_along(pp_present),
                      function(k) {
                        fmt_pp(pp_mat[i, k], k == top_idx[i])
                      }, character(1))
    c(vapply(display_present, function(col) {
        as.character(df[[col]][i])
      }, character(1)),
      pp_strs,
      fmt_verdict(df$verdict[i]))
  })
  .print_aligned(hdr, rows)
}

# Width-aware aligned printing. `vwidth` strips ANSI escape sequences so
# colored cells line up correctly; `pad_to` right-pads to a target width.
.print_aligned <- function(hdr, rows) {
  # Visible width of a cell, ignoring ANSI color codes.
  vwidth <- function(s) nchar(gsub("\033\\[[0-9;]*m", "", s))
  pad_to <- function(s, w) {
    pad <- max(0L, w - vwidth(s))
    paste0(s, strrep(" ", pad))
  }
  ncols <- length(hdr)
  # No data rows: print the header only.
  if (length(rows) == 0L) {
    cat(" ", paste(hdr, collapse = " "), "\n", sep = "")
    return(invisible())
  }
  # Column width = max of header width and widest body cell.
  widths <- vapply(seq_len(ncols), function(k) {
    body_w <- max(vapply(rows, function(r) vwidth(r[[k]]), integer(1)))
    max(vwidth(hdr[k]), body_w)
  }, integer(1))
  cat(" ",
      paste(vapply(seq_len(ncols),
                   function(k) pad_to(hdr[k], widths[k]), character(1)),
            collapse = " "),
      "\n", sep = "")
  cat(" ", paste(strrep("-", widths), collapse = " "), "\n", sep = "")
  for (r in rows) {
    cat(" ",
        paste(vapply(seq_len(ncols),
                     function(k) pad_to(r[[k]], widths[k]), character(1)),
              collapse = " "),
        "\n", sep = "")
  }
  invisible()
}

================================================
FILE: R/susie_rss_utils.R
================================================
# =============================================================================
# FUNDAMENTAL COMPUTATIONS
#
# Basic mathematical utilities and core RSS computations. These functions
# handle fundamental operations like sufficient statistics computation and
# eigenvalue inverse calculations.
#
# Functions: compute_suff_stat, compute_Dinv, safe_pd_decomp
# =============================================================================

# Decompose a symmetric PSD matrix for efficient log-determinant and solve.
# Uses Cholesky when the matrix is PD (fast, O(r^3/6)). Falls back to
# eigendecomposition when the matrix is singular (e.g.
# lambda=0 at simplex vertices in omega optimization), projecting out the
# null-space.
#
# Returns a list with:
#   logdet  - log-determinant (only over positive eigenvalues)
#   r_eff   - effective rank (number of positive eigenvalues)
#   solve   - function(v) that computes S^{-1} v (or pseudoinverse for singular S)
#   solve_z - S^{-1} applied to a specific vector z (precomputed for speed)
#
#' @keywords internal
safe_pd_decomp <- function(S, z = NULL) {
  p_dim <- nrow(S)

  # Fast path: a Cholesky factorization succeeds exactly when S is PD.
  R_chol <- tryCatch(chol(S), error = function(e) NULL)
  if (!is.null(R_chol)) {
    # S = R'R, so log|S| = 2*sum(log(diag(R))) and S^{-1} v is a pair of
    # triangular solves against the same factor.
    apply_inv <- function(v)
      backsolve(R_chol, backsolve(R_chol, v, transpose = TRUE))
    return(list(
      logdet  = 2 * sum(log(diag(R_chol))),
      r_eff   = p_dim,
      solve   = apply_inv,
      solve_z = if (is.null(z)) NULL else apply_inv(z)
    ))
  }

  # Slow path: S is singular (or numerically not PD). Eigendecompose, clamp
  # tiny negatives to zero, and restrict to the strictly positive spectrum,
  # which yields the pseudoinverse on the column space.
  ed     <- eigen(S, symmetric = TRUE)
  evals  <- pmax(ed$values, 0)
  keep   <- evals > .Machine$double.eps * max(evals)
  d_keep <- evals[keep]
  U_keep <- ed$vectors[, keep, drop = FALSE]
  apply_pinv <- function(v) U_keep %*% (crossprod(U_keep, v) / d_keep)
  list(
    logdet  = sum(log(d_keep)),
    r_eff   = sum(keep),
    solve   = apply_pinv,
    solve_z = if (is.null(z)) NULL else apply_pinv(z)
  )
}

#' @title Compute sufficient statistics for input to \code{susie_ss}
#'
#' @description Computes the sufficient statistics \eqn{X'X, X'y, y'y}
#' and \eqn{n} after centering (and possibly standardizing) the
#' columns of \eqn{X} and centering \eqn{y} to have mean zero. We also
#' store the column means of \eqn{X} and mean of \eqn{y}.
#'
#' @param X An n by p matrix of covariates.
#'
#' @param y An n vector.
#'
#' @param standardize Logical flag indicating whether to standardize
#' columns of X to unit variance prior to computing summary data
#'
#' @return A list of sufficient statistics (\code{XtX, Xty, yty, n})
#' and \code{X_colmeans}, \code{y_mean}.
#'
#' @importFrom methods as
#' @importFrom Matrix colMeans
#' @importFrom Matrix crossprod
#'
#' @examples
#' data(N2finemapping)
#' ss <- compute_suff_stat(N2finemapping$X, N2finemapping$Y[, 1])
#'
#' @export
#'
compute_suff_stat <- function(X, y, standardize = FALSE) {
  # Center y; its mean is returned so predictions can be un-centered later.
  y_mean <- mean(y)
  y <- y - y_mean
  n <- nrow(X)
  mu <- colMeans(X)
  # Column standard deviations; compute_colSds is defined elsewhere in the
  # package.
  s <- compute_colSds(X)
  # Because y now has mean zero, X'y is unchanged by centering X, so the raw
  # cross-product is already the centered one.
  Xty <- drop(y %*% X)
  XtX <- crossprod(X)
  XtX <- as.matrix(XtX)
  # Center X'X: (X - 1 mu')'(X - 1 mu') = X'X - n mu mu'.
  XtX <- XtX - n * tcrossprod(mu)
  if (standardize) {
    # Scale rows and columns of XtX (and Xty) by the column sds.
    XtX <- XtX / s
    XtX <- t(XtX)
    XtX <- XtX / s
    Xty <- Xty / s
  }
  n <- length(y)
  yty <- sum(y^2)
  return(list(
    XtX = XtX, Xty = Xty, yty = yty, n = n,
    y_mean = y_mean, X_colmeans = mu
  ))
}

# Compute inverse eigenvalues for RSS-lambda methods.
# D^{-1} with D = sigma2 * eigenvalues(R) + lambda; infinite entries
# (zero eigenvalue with lambda = 0) are zeroed, i.e. a pseudoinverse.
#' @keywords internal
compute_Dinv <- function(model, data) {
  eigen_R <- get_eigen_R(data, model)
  Dinv <- 1 / (model$sigma2 * eigen_R$values + data$lambda)
  Dinv[is.infinite(Dinv)] <- 0
  return(Dinv)
}

# Accessor for eigen_R: check model first (multi-panel), fall through to data
#' @keywords internal
get_eigen_R <- function(data, model) {
  if (!is.null(model$eigen_R)) model$eigen_R else data$eigen_R
}

# Accessor for Vtz: check model first (multi-panel), fall through to data
#' @keywords internal
get_Vtz <- function(data, model) {
  if (!is.null(model$Vtz)) model$Vtz else data$Vtz
}

# =============================================================================
# RSS MODEL METHODS
#
# Core RSS algorithm functions including parameter estimation and model
# preprocessing. These implement the mathematical framework for RSS-based
# fine-mapping and handle iteration-specific computations.
#
# Functions: estimate_s_rss, precompute_rss_lambda_terms
# =============================================================================

#' @title Estimate s in \code{susie_rss} Model Using Regularized LD
#'
#' @description The estimated s gives information about the
#' consistency between the z scores and LD matrix.
#' A larger \eqn{s}
#' means there is a strong inconsistency between z scores and LD
#' matrix. The \dQuote{null-mle} method obtains mle of \eqn{s} under
#' \eqn{z | R ~ N(0,(1-s)R + s I)}, \eqn{0 < s < 1}. The
#' \dQuote{null-partialmle} method obtains mle of \eqn{s} under
#' \eqn{U^T z | R ~ N(0,s I)}, in which \eqn{U} is a matrix containing
#' the eigenvectors that span the null space of R; that is, the
#' eigenvectors corresponding to zero eigenvalues of R. The estimated
#' \eqn{s} from \dQuote{null-partialmle} could be greater than 1. The
#' \dQuote{null-pseudomle} method obtains mle of \eqn{s} under
#' pseudolikelihood \eqn{L(s) = \prod_{j=1}^{p} p(z_j | z_{-j}, s,
#' R)}, \eqn{0 < s < 1}.
#'
#' @param z A p-vector of z scores.
#'
#' @param R A p by p symmetric, positive semidefinite correlation
#' matrix.
#'
#' @param n The sample size. (Optional, but highly recommended.)
#'
#' @param r_tol Tolerance level for eigenvalue check of positive
#' semidefinite matrix of R.
#'
#' @param method a string specifies the method to estimate \eqn{s}.
#'
#' @return A number between 0 and 1.
#'
#' @examples
#' set.seed(1)
#' n <- 500
#' p <- 1000
#' beta <- rep(0, p)
#' beta[1:4] <- 0.01
#' X <- matrix(rnorm(n * p), nrow = n, ncol = p)
#' X <- scale(X, center = TRUE, scale = TRUE)
#' y <- drop(X %*% beta + rnorm(n))
#' input_ss <- compute_suff_stat(X, y, standardize = TRUE)
#' ss <- univariate_regression(X, y)
#' R <- cor(X)
#' attr(R, "eigen") <- eigen(R, symmetric = TRUE)
#' zhat <- with(ss, betahat / sebetahat)
#'
#' # Estimate s using the unadjusted z-scores.
#' s0 <- estimate_s_rss(zhat, R)
#'
#' # Estimate s using the adjusted z-scores.
#' s1 <- estimate_s_rss(zhat, R, n)
#'
#' @importFrom stats dnorm
#' @importFrom stats optim
#'
#' @export
#'
estimate_s_rss <- function(z, R, n, r_tol = 1e-08, method = "null-mle") {
  # Check and process input arguments z, R. Missing z-scores are treated as
  # exactly null; the eigendecomposition of R is cached as an attribute so
  # repeated calls do not recompute it.
  z[is.na(z)] <- 0
  if (is.null(attr(R, "eigen"))) {
    attr(R, "eigen") <- eigen(R, symmetric = TRUE)
  }
  eigenld <- attr(R, "eigen")
  if (any(eigenld$values < -r_tol)) {
    warning_message(
      "The matrix R is not positive semidefinite. Negative ",
      "eigenvalues are set to zero"
    )
  }
  # Clamp near-zero/negative eigenvalues to exactly zero.
  eigenld$values[eigenld$values < r_tol] <- 0
  # Check input n, and adjust the z-scores if n is provided.
  if (missing(n)) {
    warning_message(
      "Providing the sample size (n), or even a rough estimate of n, ",
      "is highly recommended. Without n, the implicit assumption is ",
      "n is large (Inf) and the effect sizes are small (close to zero)."
    )
  } else if (n <= 1) {
    stop("n must be greater than 1")
  }
  if (!missing(n)) {
    # Finite-sample shrinkage of the z-scores before fitting s.
    sigma2 <- (n - 1) / (z^2 + n - 2)
    z <- sqrt(sigma2) * z
  }
  if (method == "null-mle") {
    # Negative log-likelihood of z under N(0, (1-s)R + sI), expressed in the
    # eigenbasis of R so the covariance is diagonal: (1-s)d + s.
    negloglikelihood <- function(s, ztv, d) {
      0.5 * sum(log((1 - s) * d + s)) +
        0.5 * tcrossprod(ztv / ((1 - s) * d + s), ztv)
    }
    s <- optim(0.5,
      fn = negloglikelihood, ztv = crossprod(z, eigenld$vectors),
      d = eigenld$values,
      method = "Brent", lower = 0, upper = 1
    )$par
  } else if (method == "null-partialmle") {
    # MLE restricted to the null space of R; may exceed 1.
    colspace <- which(eigenld$values > 0)
    if (length(colspace) == length(z)) {
      # R has full rank: no null space, so s = 0.
      s <- 0
    } else {
      znull <- crossprod(eigenld$vectors[, -colspace], z) # U2^T z
      s <- sum(znull^2) / length(znull)
    }
  } else if (method == "null-pseudomle") {
    # Pseudolikelihood: product over j of p(z_j | z_{-j}, s, R), using the
    # conditional-normal formulas in terms of the precision matrix.
    pseudolikelihood <- function(s, z, eigenld) {
      precision <- eigenld$vectors %*%
        (t(eigenld$vectors) * (1 / ((1 - s) * eigenld$values + s)))
      postmean <- rep(0, length(z))
      postvar <- rep(0, length(z))
      for (i in 1:length(z)) {
        postmean[i] <- -(1 / precision[i, i]) * precision[i, -i] %*% z[-i]
        postvar[i] <- 1 / precision[i, i]
      }
      return(-sum(dnorm(z, mean = postmean, sd = sqrt(postvar), log = TRUE)))
    }
    s <- optim(0.5,
      fn = pseudolikelihood, z = z, eigenld = eigenld,
      method = "Brent", lower = 0, upper = 1
    )$par
  } else {
    stop("The method is not implemented")
  }
  return(s)
}

# Precompute RSS lambda terms that change per IBSS iteration
#' @keywords internal
precompute_rss_lambda_terms <-
function(data, model) {
  # Precompute quantities that change per IBSS iteration.
  # When slot_weights (c_hat) are active, Z and zbar are weighted by sw_l
  # so that get_ER2.rss_lambda and the omega evaluator see c_hat-weighted
  # posterior means. diag_postb2 is weighted by sw_l (not sw_l^2) because
  # E[c_l^2] = c_hat_l for Bernoulli.
  sw <- if (!is.null(model$slot_weights)) {
    model$slot_weights
  } else {
    rep(1, nrow(model$alpha))
  }
  # Z: L x p matrix of (weighted) per-effect posterior means alpha * mu.
  model$Z <- sw * model$alpha * model$mu
  # zbar: posterior mean effect summed over the L single effects.
  model$zbar <- colSums(model$Z)
  # diag_postb2: per-variable sum of (weighted) posterior second moments.
  model$diag_postb2 <- colSums(sw * model$alpha * model$mu2)
  return(model)
}

# estimate_lambda_bias and apply_inflation_state moved to R/rss_mismatch.R.

# =============================================================================
# MULTI-PANEL LD MIXTURE
#
# Functions for combining K reference LD panels with learnable convex weights.
# R(omega) = sum_k omega_k R_hat_k, with X_meta = [sqrt(omega_1) X_1; ...].
#
# Key functions:
#   form_X_meta                -- form composite X from K panels with weights
#   eigen_from_X               -- SVD-based eigendecomposition from X matrix
#   precompute_omega_cache     -- joint SVD for reduced-basis optimization
#   precompute_omega_iteration -- per-IBSS-iter bilinear forms
#   eval_omega_eloglik_reduced -- O(r^3) Eloglik evaluator (Cholesky)
#   eigen_from_reduced         -- recover full p-dim eigen from reduced basis
#   eval_omega_eloglik_R       -- O(p^3) reference implementation (testing)
#   optimize_omega             -- simplex optimizer (Grid+Brent or Frank-Wolfe)
# =============================================================================

# Form composite X from K panels with weights omega.
# Pre-allocates output to avoid K intermediate copies; rows for panels with
# zero weight are left as zeros.
#' @keywords internal
form_X_meta <- function(X_list, omega) {
  K <- length(X_list)
  p <- ncol(X_list[[1]])
  nrs <- vapply(X_list, nrow, integer(1))
  X_meta <- matrix(0, sum(nrs), p)
  offset <- 0L
  for (k in seq_len(K)) {
    rows <- offset + seq_len(nrs[k])
    if (omega[k] > 0) X_meta[rows, ] <- sqrt(omega[k]) * X_list[[k]]
    offset <- offset + nrs[k]
  }
  X_meta
}

# SVD-based
# eigendecomposition from X matrix (X'X = R). Eigenvalues are the squared
# singular values; the basis is padded with zero vectors/values up to p so
# callers always get a full p x p decomposition.
#' @keywords internal
eigen_from_X <- function(X, p) {
  sv <- svd(X, nu = 0)
  eigen_values <- pmax(sv$d^2, 0)
  eigen_vectors <- sv$v
  if (ncol(eigen_vectors) < p) {
    # Pad up to dimension p with zero eigenvectors / eigenvalues.
    eigen_vectors <- cbind(eigen_vectors, matrix(0, p, p - ncol(eigen_vectors)))
    eigen_values <- c(eigen_values, rep(0, p - length(eigen_values)))
  }
  idx <- order(eigen_values, decreasing = TRUE)
  list(values = eigen_values[idx], vectors = eigen_vectors[, idx])
}

# Precompute reduced-basis quantities for fast omega optimization.
#
# For K panels with reference factor matrices X_k (B_k x p), projects all panel
# correlations into a joint reduced basis V_s (p x r) where r = rank of
# [X_1; ...; X_K]. Each Brent evaluation then works on r x r matrices
# (Cholesky + backsolves) instead of p x p eigendecompositions.
#
# Returns a list to be stored in data$omega_cache.
#' @keywords internal
precompute_omega_cache <- function(X_list, z, r_tol = 1e-8) {
  X_stack <- do.call(rbind, X_list)
  sv <- svd(X_stack, nu = 0)
  # Keep only singular directions above tolerance; these span the joint
  # column space of all panels.
  keep <- sv$d > r_tol
  V_s <- sv$v[, keep, drop = FALSE]
  r <- ncol(V_s)
  # Project each panel into reduced basis: A_k = V_s' R_k V_s (r x r)
  A_list <- lapply(X_list, function(Xk) {
    Zk <- Xk %*% V_s
    crossprod(Zk)
  })
  list(
    V_s = V_s,
    r = r,
    A_list = A_list,
    Vsz = as.vector(crossprod(V_s, z)),
    z_norm2 = sum(z^2)
  )
}

# Precompute per-IBSS-iteration quantities for the omega Brent evaluator.
# Called once per IBSS iteration (not per Brent eval).
#' @keywords internal
precompute_omega_iteration <- function(cache, zbar, diag_postb2, Z) {
  # zbar projected into the reduced basis.
  Vsz_bar <- as.vector(crossprod(cache$V_s, zbar))
  ZVs <- Z %*% cache$V_s # L x r
  M_postb2 <- crossprod(cache$V_s * diag_postb2, cache$V_s) # r x r
  list(Vsz_bar = Vsz_bar, ZVs = ZVs, M_postb2 = M_postb2)
}

# Evaluate Eloglik at a candidate omega using reduced basis + Cholesky.
#
# Uses precomputed A_k*vector products from precompute_omega_iteration,
# so per-eval work is dominated by the r x r Cholesky + backsolves.
#' @keywords internal
eval_omega_eloglik_reduced <- function(cache, omega, iter_cache, sigma2,
                                       lambda, K, p) {
  r <- cache$r
  # Form A(omega) = sum_k omega_k A_k once; reused for all terms
  A_omega <- omega[1] * cache$A_list[[1]]
  for (k in seq_len(K)[-1]) A_omega <- A_omega + omega[k] * cache$A_list[[k]]
  # S_r = sigma2 * A(omega) + lambda * I_r
  # Uses safe_pd_decomp: Cholesky when PD, eigen fallback when singular
  # (lambda=0 at simplex vertices where one panel's weight = 0).
  S_r <- sigma2 * A_omega + lambda * diag(r)
  decomp <- safe_pd_decomp(S_r, z = cache$Vsz)
  Sinv_Vsz <- decomp$solve_z
  solve_S <- decomp$solve
  # log|S|: column-space from decomp, null-space from lambda (if > 0)
  logdet_null <- if (lambda > 0) (p - r) * log(lambda) else 0
  logdet_term <- -0.5 * (decomp$logdet + logdet_null)
  # z^T S^{-1} z: null-space term only when lambda > 0
  z_null_norm2 <- max(cache$z_norm2 - sum(cache$Vsz^2), 0)
  zSinvz <- sum(cache$Vsz * Sinv_Vsz)
  if (lambda > 0) zSinvz <- zSinvz + z_null_norm2 / lambda
  # Effective dimension: full p when lambda > 0 (null-space contributes),
  # only the effective rank of S_r when lambda = 0.
  p_eff <- if (lambda > 0) p else decomp$r_eff
  # term2: -2 * zbar' R(omega) S^{-1} z
  RSinvz_r <- A_omega %*% Sinv_Vsz
  term2 <- -2 * sum(iter_cache$Vsz_bar * RSinvz_r)
  # term3: zbar' R(omega) S^{-1} R(omega) zbar
  A_Vsz_bar <- A_omega %*% iter_cache$Vsz_bar
  Sinv_A_Vsz_bar <- solve_S(A_Vsz_bar)
  term3 <- sum(A_Vsz_bar * Sinv_A_Vsz_bar)
  # term4: -tr(Z' R(omega) S^{-1} R(omega) Z)
  A_ZVs_t <- A_omega %*% t(iter_cache$ZVs)
  Sinv_A_ZVs_t <- solve_S(A_ZVs_t)
  term4 <- -sum(A_ZVs_t * Sinv_A_ZVs_t)
  # term5: tr(diag(postb2) R(omega) S^{-1} R(omega))
  AMA_omega <- A_omega %*% iter_cache$M_postb2 %*% A_omega
  Sinv_AMA <- solve_S(AMA_omega)
  term5 <- sum(diag(Sinv_AMA))
  ER2 <- zSinvz + term2 + term3 + term4 + term5
  # Always include the column-space log|S(omega)|: it is omega-dependent and
  # is the primary driver of mixture weight selection. At lambda=0 the
  # null-space pieces (logdet_null, z_null_norm2/lambda) are constants in
  # omega given the joint reduced basis, so dropping them is fine --- but
  # dropping logdet_term itself erases the omega signal.
  -p_eff / 2 * log(2 * pi) + logdet_term - 0.5 * ER2
}

# Recover full eigendecomposition from reduced basis after omega is chosen.
# Called once per IBSS iteration (after Brent converges), not per eval.
#' @keywords internal
eigen_from_reduced <- function(cache, omega, K, p) {
  A_omega <- omega[1] * cache$A_list[[1]]
  for (k in seq_len(K)[-1]) A_omega <- A_omega + omega[k] * cache$A_list[[k]]
  # Symmetrize before eigen to guard against round-off asymmetry.
  eig <- eigen(0.5 * (A_omega + t(A_omega)), symmetric = TRUE)
  d <- pmax(eig$values, 0)
  # Rotate the reduced-basis eigenvectors back to the full p-dim space.
  V_full <- cache$V_s %*% eig$vectors
  if (cache$r < p) {
    # Pad with zero eigenvectors / eigenvalues to full dimension p.
    V_full <- cbind(V_full, matrix(0, p, p - cache$r))
    d <- c(d, rep(0, p - cache$r))
  }
  list(values = d, vectors = V_full)
}

# Naive O(p^3) Eloglik evaluator (used for testing and as reference).
# Forms R(omega), eigendecomposes the p x p matrix, evaluates Eloglik.
#' @keywords internal
eval_omega_eloglik_R <- function(panel_R, omega, z, zbar, diag_postb2, Z,
                                 sigma2, lambda, K, p) {
  # Form R(omega) = sum_k omega_k R_k
  R_omega <- omega[1] * panel_R[[1]]
  for (k in seq_len(K)[-1]) R_omega <- R_omega + omega[k] * panel_R[[k]]
  # Symmetrize to guard against round-off asymmetry before eigen.
  R_omega <- 0.5 * (R_omega + t(R_omega))
  # Eigendecompose
  eig <- eigen(R_omega, symmetric = TRUE)
  D <- pmax(eig$values, 0)
  V <- eig$vectors
  # Eloglik computation, all in the eigenbasis of R(omega) where
  # S = sigma2 R + lambda I is diagonal with entries S_diag.
  Vtz <- crossprod(V, z)
  z_null_norm2 <- max(sum(z^2) - sum(Vtz^2), 0)
  S_diag <- sigma2 * D + lambda
  Dinv <- ifelse(S_diag > 0, 1 / S_diag, 0)
  DinvD2 <- Dinv * D^2
  # When lambda=0, skip zero entries in log-det and null-space terms
  S_pos <- S_diag[S_diag > 0]
  logdet_term <- -0.5 * sum(log(S_pos))
  # z' S^{-1} z (plus null-space contribution when lambda > 0).
  zSinvz <- sum(Dinv * Vtz^2)
  if (lambda > 0) zSinvz <- zSinvz + z_null_norm2 / lambda
  # term2: -2 zbar' R S^{-1} z
  RSinvz <- V %*% (Dinv * D * Vtz)
  term2 <- -2 * sum(zbar * RSinvz)
  # term3: zbar' R S^{-1} R zbar
  Vtzbar <- crossprod(V, zbar)
  term3 <- sum(Vtzbar^2 * DinvD2)
  # term4: -tr(Z' R S^{-1} R Z)
  ZV <- Z %*% V
  term4 <- -sum(ZV^2 %*% DinvD2)
  # term5: tr(diag(postb2) R S^{-1} R)
  diag_RSinvR <- colSums(t(V)^2 * DinvD2)
  term5 <- sum(diag_RSinvR * diag_postb2)
  ER2 <- zSinvz + term2 + term3 + term4 + term5
  p_eff <- length(S_pos)
  # See eval_omega_eloglik_reduced: always keep column-space logdet_term.
  -p_eff / 2 * log(2 * pi) + logdet_term - 0.5 * ER2
}

# Optimize omega on the K-simplex by maximizing eval_fn.
# Uses the Frank-Wolfe conditional gradient algorithm: each iteration
# evaluates the objective at all K simplex vertices to find the steepest
# ascent direction, then performs a line search (Brent's method) toward
# that vertex. For K=2 a coarse grid warm-start is prepended since the
# simplex is 1D and the grid cost is negligible.
# Returns list(omega, converged) where converged indicates max|delta| < tol.
#' @keywords internal
#' @importFrom stats optimize
optimize_omega <- function(eval_fn, omega_cur, K, tol = .omega_tol) {
  # Maximize eval_fn over the K-simplex, starting from omega_cur.
  #
  # eval_fn   : function of a length-K weight vector, returns a scalar.
  # omega_cur : current weights (starting point; also the reference for the
  #             `converged` flag).
  # K         : number of panels (simplex dimension).
  # tol       : list with grid_spacing, fw_max_iter, fw_stop, convergence.
  #
  # Returns list(omega, converged); converged is TRUE when the final omega
  # moved less than tol$convergence (sup-norm) from omega_cur.
  omega <- omega_cur
  cur_val <- eval_fn(omega)
  # K=2 warm-start: coarse grid over the 1D simplex
  if (K == 2) {
    grid <- seq(0, 1, tol$grid_spacing)
    vals <- vapply(grid, function(w1) eval_fn(c(w1, 1 - w1)), numeric(1))
    best_w1 <- grid[which.max(vals)]
    omega <- c(best_w1, 1 - best_w1)
    cur_val <- max(vals)
  }
  # Frank-Wolfe: conditional gradient on simplex with Brent line search.
  # For K=2 the grid already evaluated the vertices; cache them. Vertex k=1
  # is e_1 = (1,0), i.e. w1 = 1 (the LAST grid point), and vertex k=2 is
  # e_2 = (0,1), i.e. w1 = 0 (the FIRST grid point). BUG FIX: the cache was
  # previously stored as c(vals[1], vals[length(vals)]), which swapped the
  # two vertices and could send the first FW line search toward the wrong
  # vertex.
  vertex_cache <- if (K == 2) c(vals[length(vals)], vals[1]) else NULL
  for (fw_iter in seq_len(tol$fw_max_iter)) {
    vertex_vals <- if (!is.null(vertex_cache)) {
      vertex_cache
    } else {
      vapply(seq_len(K), function(k) {
        e_k <- rep(0, K); e_k[k] <- 1; eval_fn(e_k)
      }, numeric(1))
    }
    vertex_cache <- NULL # only reuse on first iteration
    k_star <- which.max(vertex_vals)
    s <- rep(0, K); s[k_star] <- 1
    # Brent line search from the current iterate toward the best vertex.
    opt <- optimize(function(gamma) eval_fn((1 - gamma) * omega + gamma * s),
      interval = c(0, 1), maximum = TRUE)
    # Absolute improvement check: conservative for large negative Eloglik values
    if (opt$objective - cur_val < tol$fw_stop) break
    omega <- (1 - opt$maximum) * omega + opt$maximum * s
    cur_val <- opt$objective
  }
  converged <- max(abs(omega - omega_cur)) < tol$convergence
  list(omega = omega, converged = converged)
}

# =============================================================================
# DIAGNOSTIC & QUALITY CONTROL
#
# Functions for RSS model diagnostics, data quality assessment, and
# validation. These help users assess the compatibility between z-scores
# and LD matrices and identify potential data issues.
#
# Functions: kriging_rss
# =============================================================================

#' @title Compute Distribution of z-scores of Variant j Given Other z-scores, and Detect Possible Allele Switch Issue
#'
#' @description Under the null, the rss model with regularized LD
#' matrix is \eqn{z|R,s ~ N(0, (1-s)R + s I))}. We use a mixture of
#' normals to model the conditional distribution of z_j given other z
#' scores, \eqn{z_j | z_{-j}, R, s ~ \sum_{k=1}^{K} \pi_k
#' N(-\Omega_{j,-j} z_{-j}/\Omega_{jj}, \sigma_{k}^2/\Omega_{jj})},
#' \eqn{\Omega = ((1-s)R + sI)^{-1}}, \eqn{\sigma_1, ..., \sigma_k}
#' is a grid of fixed positive numbers. We estimate the mixture
#' weights \eqn{\pi}. We detect the possible allele switch issue
#' using likelihood ratio for each variant.
#'
#' @param z A p-vector of z scores.
#'
#' @param R A p by p symmetric, positive semidefinite correlation
#' matrix.
#'
#' @param n The sample size. (Optional, but highly recommended.)
#'
#' @param r_tol Tolerance level for eigenvalue check of positive
#' semidefinite matrix of R.
#'
#' @param s an estimated s from \code{estimate_s_rss}
#'
#' @return a list containing a ggplot2 plot object and a table. The plot
#' compares observed z score vs the expected value. The possible allele
#' switched variants are labeled as red points (log LR > 2 and abs(z) > 2).
#' The table summarizes the conditional distribution for each variant
#' and the likelihood ratio test. The table has the following columns:
#' the observed z scores, the conditional expectation, the conditional
#' variance, the standardized differences between the observed z score
#' and expected value, the log likelihood ratio statistics.
#'
#' @importFrom stats dnorm
#' @importFrom ggplot2 ggplot
#' @importFrom ggplot2 geom_point
#' @importFrom ggplot2 geom_abline
#' @importFrom ggplot2 theme_bw
#' @importFrom ggplot2 labs
#' @importFrom ggplot2 aes_string
#' @importFrom mixsqp mixsqp
#'
#' @examples
#' # See also the vignette, "Diagnostic for fine-mapping with summary
#' # statistics."
#' set.seed(1)
#' n <- 500
#' p <- 1000
#' beta <- rep(0, p)
#' beta[1:4] <- 0.01
#' X <- matrix(rnorm(n * p), nrow = n, ncol = p)
#' X <- scale(X, center = TRUE, scale = TRUE)
#' y <- drop(X %*% beta + rnorm(n))
#' ss <- univariate_regression(X, y)
#' R <- cor(X)
#' attr(R, "eigen") <- eigen(R, symmetric = TRUE)
#' zhat <- with(ss, betahat / sebetahat)
#' cond_dist <- kriging_rss(zhat, R, n = n)
#' cond_dist$plot
#'
#' @export
#'
kriging_rss <- function(z, R, n, r_tol = 1e-08,
                        s = estimate_s_rss(z, R, n, r_tol,
                                           method = "null-mle")) {
  # Check and process input arguments z, R. Missing z-scores are treated as
  # exactly null; the eigendecomposition of R is cached as an attribute.
  z[is.na(z)] <- 0
  if (is.null(attr(R, "eigen"))) {
    attr(R, "eigen") <- eigen(R, symmetric = TRUE)
  }
  eigenld <- attr(R, "eigen")
  if (any(eigenld$values < -r_tol)) {
    warning_message(
      "The matrix R is not positive semidefinite. Negative ",
      "eigenvalues are set to zero."
    )
  }
  eigenld$values[eigenld$values < r_tol] <- 0
  # Check and progress input argument s. force() evaluates the default
  # (estimate_s_rss) before z is modified below.
  force(s)
  if (s > 1) {
    warning_message("The given s is greater than 1. We replace it with 0.8.")
    s <- 0.8
  } else if (s < 0) {
    stop("The s must be non-negative")
  }
  # Check input n, and adjust the z-scores if n is provided.
  if ((!missing(n)) && (n <= 1)) {
    stop("n must be greater than 1")
  }
  if (missing(n)) {
    warning_message(
      "Providing the sample size (n), or even a rough estimate of n, ",
      "is highly recommended. Without n, the implicit assumption is ",
      "n is large (Inf) and the effect sizes are small (close to zero)."
    )
  } else {
    # Finite-sample shrinkage of the z-scores.
    sigma2 <- (n - 1) / (z^2 + n - 2)
    z <- sqrt(sigma2) * z
  }
  # Precision matrix of the regularized LD model, Omega = ((1-s)R + sI)^{-1},
  # computed in the eigenbasis; infinite entries (zero eigenvalue, s = 0)
  # are zeroed.
  dinv <- 1 / ((1 - s) * eigenld$values + s)
  dinv[is.infinite(dinv)] <- 0
  precision <- eigenld$vectors %*% (t(eigenld$vectors) * dinv)
  # Conditional mean/variance of each z_j given all other z-scores.
  condmean <- rep(0, length(z))
  condvar <- rep(0, length(z))
  for (i in 1:length(z)) {
    condmean[i] <- -(1 / precision[i, i]) * precision[i, -i] %*% z[-i]
    condvar[i] <- 1 / precision[i, i]
  }
  z_std_diff <- (z - condmean) / sqrt(condvar)
  # obtain grid of mixture sds, geometric from a_min up to a_max.
  a_min <- 0.8
  if (max(z_std_diff^2) < 1) {
    a_max <- 2
  } else {
    a_max <- 2 * sqrt(max(z_std_diff^2))
  }
  npoint <- ceiling(log2(a_max / a_min) / log2(1.05))
  a_grid <- 1.05^(seq(-npoint, 0)) * a_max
  # compute likelihood of each variant under each grid sd (log scale,
  # row-wise max subtracted for numerical stability).
  sd_mtx <- outer(sqrt(condvar), a_grid)
  matrix_llik <- dnorm(z - condmean, sd = sd_mtx, log = TRUE)
  lfactors <- apply(matrix_llik, 1, max)
  matrix_llik <- matrix_llik - lfactors
  # estimate mixture weights by maximum likelihood (mix-SQP).
  w <- mixsqp(matrix_llik, log = TRUE, control = list(verbose = FALSE))$x
  # Compute denominators in likelihood ratios.
  logl0mix <- drop(log(exp(matrix_llik) %*% (w + 1e-15))) + lfactors
  # Compute numerators in likelihood ratios: likelihood under an allele
  # switch, i.e. the conditional mean with flipped sign (z + condmean).
  matrix_llik <- dnorm(z + condmean, sd = sd_mtx, log = TRUE)
  lfactors <- apply(matrix_llik, 1, max)
  matrix_llik <- matrix_llik - lfactors
  logl1mix <- drop(log(exp(matrix_llik) %*% (w + 1e-15))) + lfactors
  # Compute (log) likelihood ratios.
  logLRmix <- logl1mix - logl0mix
  z <- drop(z)
  z_std_diff <- drop(z_std_diff)
  res <- data.frame(
    z = z, condmean = condmean, condvar = condvar,
    z_std_diff = z_std_diff, logLR = logLRmix
  )
  # Observed vs expected z-scores; points above the LR/|z| thresholds are
  # flagged in red as possible allele switches.
  p <- ggplot(res, aes(y = .data$z, x = .data$condmean)) +
    geom_point() +
    labs(y = "Observed z scores", x = "Expected value") +
    geom_abline(intercept = 0, slope = 1) +
    theme_bw()
  idx <- which(logLRmix > 2 & abs(z) > 2)
  if (length(idx) > 0) {
    p <- p + geom_point(
      data = res[idx, ],
      aes(y = .data$z, x = .data$condmean), col = "red"
    )
  }
  return(list(plot = p, conditional_dist = res))
}

================================================
FILE: R/susie_trendfilter.R
================================================
#' @title Apply susie to trend filtering (especially changepoint
#' problems), a type of non-parametric regression.
#'
#' @description Fits the non-parametric Gaussian regression model
#' \eqn{y = mu + e}, where the mean \eqn{mu} is modelled as \eqn{mu =
#' Xb}, X is a matrix with columns containing an appropriate basis,
#' and b is vector with a (sparse) SuSiE prior. In particular, when
#' \code{order = 0}, the jth column of X is a vector with the first j
#' elements equal to zero, and the remaining elements equal to 1, so
#' that \eqn{b_j} corresponds to the change in the mean of y between
#' indices j and j+1. For background on trend filtering, see
#' Tibshirani (2014). See also the "Trend filtering" vignette,
#' \code{vignette("trend_filtering")}.
#'
#' @details This implementation exploits the special structure of X,
#' which means that the matrix-vector product \eqn{X^Ty} is fast to
#' compute; in particular, the computation time is \eqn{O(n)} rather
#' than \eqn{O(n^2)} if \code{X} were formed explicitly. For
#' implementation details, see the "Implementation of SuSiE trend
#' filtering" vignette by running
#' \code{vignette("trendfiltering_derivations")}.
#'
#' @param y An n-vector of observations ordered in time or space
#' (assumed to be equally spaced).
#'
#' @param order An integer specifying the order of trend filtering.
#' The default, \code{order = 0}, corresponds to "changepoint"
#' problems (\emph{i.e.}, piecewise constant \eqn{mu}). Although
#' \code{order > 0} is implemented, we do not recommend its use; in
#' practice, we have found problems with convergence of the algorithm
#' to poor local optima, producing unreliable inferences.
#'
#' @param standardize Logical indicating whether to standardize the X
#' variables ("basis functions"); \code{standardize = FALSE} is
#' recommended as these basis functions already have a natural scale.
#'
#' @param use_mad Logical indicating whether to use the "median
#' absolute deviation" (MAD) method to the estimate residual
#' variance. If \code{use_mad = TRUE}, susie is run twice, first by
#' fixing the residual variance to the MAD value, then a second time,
#' initialized to the first fit, but with residual variance estimated
#' the usual way (by maximizing the ELBO). We have found this strategy
#' typically improves reliability of the results by reducing a
#' tendency to converge to poor local optima of the ELBO.
#'
#' @param ... Other arguments passed to \code{\link{susie}}.
#'
#' @return A "susie" fit; see \code{\link{susie}} for details.
#'
#' @references R. J. Tibshirani (2014). Adaptive piecewise polynomial
#' estimation via trend filtering. \emph{Annals of Statistics}
#' \bold{42}, 285-323.
#'
#' @examples
#' set.seed(1)
#' mu <- c(rep(0, 50), rep(1, 50), rep(3, 50), rep(-2, 50), rep(0, 200))
#' y <- mu + rnorm(400)
#' s <- susie_trendfilter(y)
#' plot(y)
#' lines(mu, col = 1, lwd = 3)
#' lines(predict(s), col = 2, lwd = 2)
#'
#' # Calculate credible sets (indices of y that occur just before
#' # changepoints).
#' susie_get_cs(s)
#'
#' # Plot with credible sets for changepoints.
#' susie_plot_changepoint(s, y)
#'
#' @importFrom Matrix sparseMatrix
#'
#' @export
#'
susie_trendfilter <- function(y, order = 0, standardize = FALSE,
                              use_mad = TRUE, ...)
{
  if (order > 0) {
    warning_message("order > 0 is not recommended")
  }
  n <- length(y)
  # Placeholder sparse matrix: the "tfmatrix" attribute makes downstream
  # matrix operations dispatch to the fast trend-filtering routines instead
  # of forming X explicitly.
  X <- sparseMatrix(i = NULL, j = NULL, dims = c(n, n))
  attr(X, "matrix.type") <- "tfmatrix"
  attr(X, "order") <- order
  # Two-stage fit: first with residual variance fixed at the MAD estimate,
  # then re-fit initialized from that solution with the variance estimated
  # by maximizing the ELBO. Skipped when the caller supplies model_init.
  if (use_mad && !("model_init" %in% names(list(...)))) {
    mad <- estimate_mad_residual_variance(y)
    s_mad_init <- suppressWarnings(susie(
      X = X, y = y, standardize = standardize,
      estimate_residual_variance = FALSE, residual_variance = mad, ...
    ))
    s <- susie(X = X, y = y, standardize = standardize,
               model_init = s_mad_init, ...)
  } else {
    s <- susie(X = X, y = y, standardize = standardize, ...)
  }
  return(s)
}

# @title estimate residual variance using MAD estimator
# @param y an n-vector
# @return a scalar of estimated residual variance
estimate_mad_residual_variance <- function(y) {
  # MAD of first differences, rescaled to be consistent for the normal sd
  # (0.6745 is the normal quartile constant); halved because differencing
  # doubles the noise variance.
  sigma2 <- 0.5 * (median(abs(diff(y)) / 0.6745)^2)
  if (sigma2 == 0) {
    stop("Cannot use median absolute deviation (MAD) to initialize residual variance because MAD = 0 for the input data. Please set 'use_mad = FALSE'")
  }
  return(sigma2)
}

================================================
FILE: R/susie_trendfilter_utils.R
================================================
# @title Compute unscaled X %*% b using the special structure of trend
#   filtering
# @param order is the order of trend filtering
# @param b an n=p vector
# @return an n vector
compute_tf_Xb <- function(order, b) {
  # Each pass applies one reversed cumulative sum; order+1 passes overall.
  for (i in 1:(order + 1)) {
    b <- rev(-1 * cumsum(rev(b)))
  }
  return(b)
}

# @title Compute unscaled t(X) %*% y using the special structure of
#   trend filtering
# @param order is the order of trend filtering
# @param y an n vector
# @return an n vector
compute_tf_Xty <- function(order, y) {
  for (i in 1:(order + 1)) {
    y <- -1 * cumsum(y)
  }
  return(y)
}

# @title Compute colSums(X*X) for X under four scenarios
# @param order is the order of trend filtering
# @param n the length of y
# @param cm column means of X
# @param csd column standard deviations of X
# @param intercept a boolean denotes whether mean centering X
# @param
# standardize a boolean denotes whether scaling X by standard deviation
# @return an n vector
compute_tf_d <- function(order, n, cm, csd, standardize = FALSE,
                         intercept = FALSE) {
  if (intercept) {
    # When standardize = TRUE, intercept = TRUE: by special
    # observation d = [n-1, n-1, ...]
    d <- rep(n - 1, n)
    if (order == 0) {
      d[n] <- 0
    }
    # When standardize = FALSE, intercept = TRUE:
    # d = [n-1, n-1, ...] * (csd^2)
    if (!standardize) {
      d <- d * csd^2
    }
    return(d)
  } else {
    # When standardize = FALSE, intercept = FALSE: d = colSums(X^2)
    base <- rep(-1, n)
    if (order == 0) {
      d <- cumsum(base^2)
    } else {
      for (i in 1:order) {
        base <- cumsum(base)
      }
      d <- cumsum(base^2)
    }
    # When standardize = TRUE, intercept = FALSE:
    # d = colSums(X^2) / (csd^2)
    if (standardize) {
      d <- d / csd^2
    }
    return(d)
  }
}

# @title Compute column mean of the trend filtering matrix X.
# @param order is the order of trend filtering
# @param n the length of y
# @return an n vector
compute_tf_cm <- function(order, n) {
  # Column sums of X via repeated cumulative sums of a ones vector,
  # divided by n to get the means.
  base <- rep(1, n)
  for (i in 1:(order + 1)) {
    base <- -cumsum(base)
  }
  return(base / n)
}

# @title Compute column standard deviation of the trend filtering
#   matrix X
# @param order is the order of trend filtering
# @param n is the length of y
# @return an n vector
compute_tf_csd <- function(order, n) {
  cm <- compute_tf_cm(order, n)
  # Sample sd from the identity var = (E[x^2] - mean^2) * n/(n-1).
  csd <- sqrt((compute_tf_d(order, n) / n - cm^2) * n / (n - 1))
  # Constant columns get sd = 1 so later divisions are no-ops.
  csd[which(csd == 0)] <- 1
  return(csd)
}

# @title A fast way to compute colSums(X*X), where X is a
#   mean-centered and standardized trend filtering matrix.
# @param order order of trend filtering
# @param n the length of y
# @return an n vector
compute_tf_std_d <- function(order, n) {
  # Centered + standardized tf matrix: every column has sum of squares
  # n - 1; for order 0 the last column is constant and contributes 0.
  res <- rep(n - 1, n)
  if (order == 0) {
    res[n] <- 0
  }
  return(res)
}


================================================
FILE: R/susie_utils.R
================================================

# =============================================================================
# FUNDAMENTAL BUILDING BLOCKS
#
# Basic mathematical operations and utilities that serve as dependencies
# for other functions. These include matrix operations, statistical computations,
# and general-purpose helper functions.
#
# Functions: warning_message, safe_cor, safe_cov2cor, is_symmetric_matrix,
# apply_nonzeros, compute_colSds, compute_colstats
# =============================================================================

# Report R process memory usage (GB). Uses gc() which is cheap.
#' @keywords internal
mem_used_gb <- function() {
  # gc()'s matrix has duplicated "(Mb)" column names; indexing by name
  # selects the first match, i.e. current Ncells/Vcells usage in Mb.
  gc_info <- gc(verbose = FALSE, reset = FALSE)
  sum(gc_info[, "(Mb)"]) / 1024
}

# Format prior variance vector: show non-zero values, summarize zeros.
# E.g., "[1.23e-01, 5.34e-02, 0 x 3]"
#' @keywords internal
format_V_summary <- function(V) {
  # NAs are counted first and removed so the zero/non-zero tallies below
  # operate on finite values only.
  n_na <- sum(is.na(V))
  V_nona <- V[!is.na(V)]
  n_zero <- sum(V_nona == 0)
  nz <- V_nona[V_nona != 0]
  parts <- sprintf("%.2e", nz)
  if (n_zero > 0) parts <- c(parts, sprintf("0 x %d", n_zero))
  if (n_na > 0) parts <- c(parts, sprintf("NA x %d", n_na))
  paste0("[", paste(parts, collapse = ", "), "]")
}

# Format slot activity (c_hat) summary for verbose output.
# Shows per-slot c_hat values and lbf when active, empty string when not.
# E.g., ", c_hat=[0.99,0.87,0.12,0.45], lbf=[12.3,8.1,0.0,-0.2], C_hat=2.4"
#' @keywords internal
format_chat_summary <- function(model) {
  weights <- model$slot_weights
  # No slot activity model fitted: contribute nothing to the output line.
  if (is.null(weights))
    return("")
  bayes_factors <- model$lbf
  bayes_factors[is.na(bayes_factors)] <- 0
  sprintf(", c_hat=[%s], lbf=[%s], C_hat=%.1f(%d>0.5)",
          paste(sprintf("%.2f", weights), collapse = ","),
          paste(sprintf("%.1f", bayes_factors), collapse = ","),
          sum(weights), sum(weights > 0.5))
}

# Utility function to display warning messages as they occur
#' @importFrom crayon combine_styles
#' @keywords internal
warning_message <- function(..., style = c("warning", "hint")) {
  style <- match.arg(style)
  # Warnings are suppressed when options(warn = -1); hints always print.
  if (style == "warning" && getOption("warn") >= 0) {
    decorate <- combine_styles("bold", "underline", "red")
    message(decorate("WARNING:"), " ", ...)
  } else {
    decorate <- combine_styles("bold", "underline", "magenta")
    message(decorate("HINT:"), " ", ...)
  }
}

#' Converts covariance matrix to correlation matrix
#' Constant variables (zero variance) get correlation 0 with others, 1 with self
#'
#' @param V Covariance matrix
#' @return Correlation matrix
#' @keywords internal
safe_cov2cor <- function(V) {
  sds <- sqrt(diag(V))
  # Zero-variance entries get an inverse scale of 0, zeroing their
  # off-diagonal correlations instead of producing Inf/NaN.
  scale_inv <- 1 / sds
  scale_inv[sds == 0] <- 0
  out <- V * outer(scale_inv, scale_inv)
  diag(out) <- 1
  out
}

#' Computes correlation matrix from data matrix
#' Handles constant columns without warnings - returns 0 correlation for constant cols
#' Uses Rfast::cora when available (much faster for large matrices), falls back
#' to crossprod-based computation otherwise.
#'
#' @param X Data matrix (n x p)
#' @return Correlation matrix (p x p)
#' @keywords internal
safe_cor <- function(X) {
  n <- nrow(X)
  cm <- colMeans(X)
  # Centered column sums of squares. Clamp at zero: catastrophic cancellation
  # in colSums(X^2) - n*cm^2 can yield a tiny negative value for
  # (near-)constant columns, which would make sqrt() below return NaN and
  # let the constant column slip past the css == 0 guard.
  css <- pmax(colSums(X^2) - n * cm^2, 0)
  has_const <- any(css == 0)

  # Fast path: use Rfast::cora when available and no constant columns
  if (!has_const && requireNamespace("Rfast", quietly = TRUE)) {
    return(Rfast::cora(X))
  }

  # Fallback: manual crossprod, handling constant columns. Population sds
  # with a final /n give the same result as cor() for non-constant columns;
  # constant columns are zeroed via sds_inv = 0.
  X_centered <- X - rep(cm, each = n)
  sds <- sqrt(css / n)
  sds_inv <- 1 / sds
  sds_inv[sds == 0] <- 0
  X_scaled <- X_centered * rep(sds_inv, each = n)
  R <- crossprod(X_scaled) / n
  diag(R) <- 1
  R
}

# Standardize X so that X'X equals the correlation matrix R.
# Centers columns, divides by column sd, then scales by 1/sqrt(n)
# so that crossprod(X_out) = cor(X_in). Constant columns are zeroed.
# This is the in-place analog of safe_cor: safe_cor(X) == crossprod(standardize_X(X)).
#' @keywords internal
standardize_X <- function(X) {
  n <- nrow(X)
  cm <- colMeans(X)
  X <- X - rep(cm, each = n)
  # css is computed AFTER centering, so it is non-negative by construction
  # (unlike the shortcut used in safe_cor).
  css <- colSums(X^2)
  sds <- sqrt(css / n)
  sds[sds < .Machine$double.eps] <- 1 # constant columns: avoid 0/0
  X <- X * rep(1 / (sds * sqrt(n)), each = n)
  X
}

#' Check for symmetric matrix
#'
#' Dispatches to Rfast::is.symmetric for plain numeric matrices when Rfast
#' is installed, otherwise to Matrix::isSymmetric (attributes ignored).
#'
#' @param x A matrix to check
#' @return Logical indicating if x is symmetric
#' @export
#' @keywords internal
is_symmetric_matrix <- function(x) {
  if (is.matrix(x) && is.numeric(x) && !isS4(x) &&
      requireNamespace("Rfast", quietly = TRUE)) {
    return(Rfast::is.symmetric(x))
  } else {
    return(Matrix::isSymmetric(x, check.attributes = FALSE))
  }
}

# Apply operation f to all nonzeros of a sparse matrix.
#' @importFrom Matrix sparseMatrix
#' @importFrom Matrix summary
#' @keywords internal
apply_nonzeros <- function(X, f) {
  # summary() yields the (i, j, x) triplets of the sparse matrix; rebuild
  # with f applied to the stored nonzero values only.
  d <- summary(X)
  return(sparseMatrix(i = d$i, j = d$j, x = f(d$x), dims = dim(X)))
}

# Computes column standard deviations for any type of matrix
# This should give the same result as matrixStats::colSds(X),
# but allows for sparse matrices as well as dense ones.
#' @importFrom matrixStats colSds
#' @importFrom Matrix summary
#' @keywords internal
compute_colSds <- function(X) {
  if (is.matrix(X)) {
    return(colSds(X))
  } else {
    # Sparse path: Var = E[x^2] - E[x]^2, rescaled by n/(n-1) to the
    # unbiased form. Squaring only the nonzeros is exact since 0^2 = 0.
    n <- nrow(X)
    Y <- apply_nonzeros(X, function(u) u^2)
    d <- colMeans(Y) - colMeans(X)^2
    return(sqrt(d * n / (n - 1)))
  }
}

# Compute the column means of X, the column standard deviations of X,
# and rowSums(Y^2), where Y is the centered and/or scaled version of
# X.
#
#' @importFrom Matrix rowSums
#' @importFrom Matrix colMeans
#' @keywords internal
compute_colstats <- function(X, center = TRUE, scale = TRUE) {
  n <- nrow(X)
  p <- ncol(X)
  if (!is.null(attr(X, "matrix.type"))) {
    # X is a trend filtering matrix: use the closed-form helpers instead of
    # touching X itself (it is an empty placeholder).
    cm <- compute_tf_cm(attr(X, "order"), p)
    csd <- compute_tf_csd(attr(X, "order"), p)
    d <- compute_tf_d(attr(X, "order"), p, cm, csd, scale, center)
    if (!center) {
      cm <- rep(0, p)
    }
    if (!scale) {
      csd <- rep(1, p)
    }
  } else {
    # X is an ordinary dense or sparse matrix. Set sd = 1 when the
    # column has variance 0.
    if (center) {
      cm <- colMeans(X, na.rm = TRUE)
    } else {
      cm <- rep(0, p)
    }
    if (scale) {
      csd <- compute_colSds(X)
      csd[csd == 0] <- 1
    } else {
      csd <- rep(1, p)
    }
    # These two lines of code should give the same result as
    #
    #   Y = (t(X) - cm)/csd
    #   d = rowSums(Y^2)
    #
    # for all four combinations of "center" and "scale", but do so
    # without having to modify X, or create copies of X in memory. In
    # particular the first line should be equivalent to colSums(X^2),
    # reconstructed from the column means and (unbiased) column variances.
    d <- n * colMeans(X)^2 + (n - 1) * compute_colSds(X)^2
    d <- (d - n * cm^2) / csd^2
  }
  return(list(cm = cm, csd = csd, d = d))
}

# Compute standard error for regression coef.
# S = (X'X)^-1 \Sigma
# Uses nrow(X) - 2 residual degrees of freedom (intercept + one predictor).
calc_stderr = function (X, residuals)
  sqrt(diag(sum(residuals^2)/(nrow(X) - 2) * chol2inv(chol(crossprod(X)))))

#' Check alpha/PIP fixed-point or short-cycle convergence
#'
#' Uses one tolerance for both marginal PIPs and alpha. Lag 1 is ordinary
#' convergence; larger lags detect a periodic orbit and average alpha over it.
#'
#' @keywords internal
check_alpha_pip_cycle_convergence <- function(data, params, model) {
  tol <- params$tol
  # Number of past iterates kept; also the longest cycle length examined.
  cycle_window <- if (!is.null(params$pip_stall_window)) params$pip_stall_window else 5
  cycle_window <- max(1L, as.integer(cycle_window))
  prior_tol <- if (!is.null(params$prior_tol)) params$prior_tol else 1e-9
  # Map an alpha matrix to marginal PIPs, reusing the current model's other
  # fields when it is a susie object.
  alpha_pip <- function(alpha) {
    tmp <- model
    tmp$alpha <- alpha
    if (inherits(tmp, "susie")) susie_get_pip(tmp, prior_tol = prior_tol) else susie_get_pip(alpha, prior_tol = prior_tol)
  }
  current_alpha <- model$alpha
  current_pip <- alpha_pip(current_alpha)
  alpha_history <- model$runtime$alpha_history
  pip_history <- model$runtime$pip_history
  if (is.null(alpha_history) || is.null(pip_history)) {
    # First call: seed the history with the previous iterate.
    alpha_history <- list(model$runtime$prev_alpha)
    pip_history <- list(alpha_pip(model$runtime$prev_alpha))
  }
  # Largest absolute change in either alpha or PIP versus a past state.
  state_diff <- function(alpha_old, pip_old) max(max(abs(current_alpha - alpha_old)), max(abs(current_pip - pip_old)))
  max_lag <- min(cycle_window, length(alpha_history))
  lag_diff <- state_diff(alpha_history[[length(alpha_history)]],
                         pip_history[[length(pip_history)]])
  reason <- NULL
  if (lag_diff < tol) {
    reason <- "alpha_pip_fixed_point"
  } else if (max_lag >= 2) {
    # Look for a period-`lag` orbit; on a hit, average alpha over the cycle.
    for (lag in 2:max_lag) {
      idx <- length(alpha_history) - lag + 1
      lag_diff <- state_diff(alpha_history[[idx]], pip_history[[idx]])
      if (lag_diff < tol) {
        reason <- paste0("alpha_pip_cycle_", lag)
        cycle_alpha <- c(tail(alpha_history, lag - 1), list(current_alpha))
        model$alpha <- Reduce(`+`, cycle_alpha) / lag
        current_alpha <- model$alpha
        current_pip <- alpha_pip(current_alpha)
        break
      }
    }
  }
  model$converged <- !is.null(reason)
  model$convergence_reason <- reason
  model$runtime$pip_diff <- lag_diff
  model$runtime$alpha_history <- c(alpha_history, list(current_alpha))
  model$runtime$pip_history <- c(pip_history, list(current_pip))
  # Trim histories to the rolling window.
  if (length(model$runtime$alpha_history) > cycle_window) {
    keep <- seq.int(length(model$runtime$alpha_history) - cycle_window + 1,
                    length(model$runtime$alpha_history))
    model$runtime$alpha_history <- model$runtime$alpha_history[keep]
    model$runtime$pip_history <- model$runtime$pip_history[keep]
  }
  return(model)
}

# =============================================================================
# DATA PROCESSING & VALIDATION
#
# Functions for input validation, data conversion between formats, and
# preprocessing operations. These ensure data integrity and compatibility
# across different SuSiE data types.
#
# Functions: check_semi_pd, check_projection, validate_init,
# convert_individual_to_ss, extract_prior_weights, reconstruct_full_weights,
# validate_and_override_params
# =============================================================================

# Check whether A is positive semidefinite
#' @keywords internal
check_semi_pd <- function(A, tol) {
  # The eigen decomposition is cached on A's attributes for reuse by
  # check_projection().
  attr(A, "eigen") <- eigen(A, symmetric = TRUE)
  v <- attr(A, "eigen")$values
  # Eigenvalues within tol of zero are treated as exactly zero.
  v[abs(v) < tol] <- 0
  return(list(
    matrix = A,
    status = !any(v < 0),
    eigenvalues = v
  ))
}

# Check whether b is in space spanned by the non-zero eigenvectors of A
#' @keywords internal
check_projection <- function(A, b) {
  if (is.null(attr(A, "eigen"))) {
    attr(A, "eigen") <- eigen(A, symmetric = TRUE)
  }
  v <- attr(A, "eigen")$values
  B <- attr(A, "eigen")$vectors[, v > .Machine$double.eps]
  # b lies in the span iff projecting it onto B leaves it unchanged;
  # all.equal() returns TRUE or a character description of the mismatch.
  msg <- all.equal(as.vector(B %*% crossprod(B, b)), as.vector(b),
    check.names = FALSE
  )
  if (!is.character(msg)) {
    return(list(status = TRUE, msg = NA))
  } else {
    return(list(status = FALSE, msg = msg))
  }
}

# Validate Model Initialization Object
#' @keywords internal
validate_init <- function(data, params) {
  if (!inherits(params$model_init, "susie")) {
    stop("model_init must be a 'susie' object")
  }
  # Assign values from initialized model
  L <- params$L
  alpha <- params$model_init$alpha
  mu <- params$model_init$mu
  mu2 <- params$model_init$mu2
  V <- params$model_init$V
  sigma2 <- params$model_init$sigma2
  pi_w <- params$model_init$pi
  null_id <- params$model_init$null_index
  # Verify no NA/Inf values in alpha
  if (any(!is.finite(alpha))) {
    stop("model_init$alpha contains NA/Inf values")
  }
  # Verify no NA/Inf values in mu
  if (any(!is.finite(mu))) {
    stop("model_init$mu contains NA/Inf values")
  }
  # Verify no NA/Inf values in mu2
  if (any(!is.finite(mu2))) {
    stop("model_init$mu2 contains NA/Inf values")
  }
  # Only check V if it exists
  if (!is.null(V)) {
    # Verify no NA/Inf values in V
    if (any(!is.finite(V))) {
      stop("model_init$V contains NA/Inf values")
    }
  }
  # Only check sigma2 if it exists
  if (!is.null(sigma2)) {
    # Verify no NA/Inf values in sigma2
    if (any(!is.finite(sigma2))) {
      stop("model_init$sigma2 contains NA/Inf")
    }
  }
  # Only check pi_w if it exists
  if (!is.null(pi_w)) {
    # Verify no NA/Inf values in prior weights
    if (any(!is.finite(pi_w))) {
      stop("model_init$pi contains NA/Inf")
    }
  }
  # Verify alpha is matrix
  if (!is.matrix(alpha)) {
    stop("model_init$alpha must be a matrix")
  }
  # Verify alpha values are between [0,1]
  if (max(alpha) > 1 || min(alpha) < 0) {
    stop(
      "model_init$alpha has invalid values outside range [0,1]; please ",
      "check your input"
    )
  }
  # Verify mu & mu2 dimensions match alpha
  if (!all(dim(mu) == dim(alpha))) {
    stop("model_init$mu and model_init$alpha dimensions do not match")
  }
  if (!all(dim(mu2) == dim(alpha))) {
    stop("model_init$mu2 and model_init$alpha dimensions do not match")
  }
  # Only validate V dimensions and values if V exists
  if (!is.null(V)) {
    # Verify V & alpha dimensions agree
    if (length(V) != nrow(alpha)) {
      stop(
        "length(model_init$V) (", length(V),
        ") does not equal nrow(model_init$alpha) (", nrow(alpha), ")"
      )
    }
    # Verify V is numeric and non-negative
    if (!is.numeric(V)) {
      stop("model_init$V must be numeric")
    }
    if (any(V < 0)) {
      stop("model_init$V has at least one negative value")
    }
  }
  # Verify sigma2 is numeric and non-negative if it exists
  if (!is.null(sigma2)) {
    if (!is.numeric(sigma2)) {
      stop("model_init$sigma2 must be numeric")
    }
    if (sigma2 < 0) {
      stop("model_init$sigma2 is negative")
    }
  }
  # Verify prior weight properties if they exist
  if (!is.null(pi_w)) {
    if (length(pi_w) != ncol(alpha)) {
      stop(
        "model_init$pi should have the same length as the number of columns",
        " in model_init$alpha"
      )
    }
  }
  invisible(params$model_init)
}

# Convert individual data to ss with unmappable effects components.
#' @keywords internal
convert_individual_to_ss <- function(data, params) {
  # Compute sufficient statistics
  XtX <- compute_XtX(data$X)
  Xty <- compute_Xty(data$X, data$y)
  yty <- sum(data$y^2)
  # Get column means and scaling from attributes
  X_colmeans <- attr(data$X, "scaled:center")
  # Create sufficient statistics data object
  ss_data <- structure(
    list(
      XtX = XtX,
      X = NULL,
      Xty = Xty,
      yty = yty,
      n = data$n,
      p = data$p,
      X_colmeans = X_colmeans,
      y_mean = data$mean_y
    ),
    class = "ss"
  )
  # Set attributes on XtX from individual X
  attr(ss_data$XtX, "d") <- attr(data$X, "d")
  attr(ss_data$XtX, "scaled:scale") <- attr(data$X, "scaled:scale")
  # Add eigen decomposition for unmappable effects methods
  ss_data <- add_eigen_decomposition(ss_data, params, data)
  return(ss_data)
}

# Extract non-null prior weights from a model
#' @keywords internal
extract_prior_weights <- function(model, null_weight = NULL) {
  # Use model's null_weight if not provided (backwards compatibility)
  if (is.null(null_weight)) {
    null_weight <- model$null_weight
  }
  if (!is.null(null_weight) && null_weight != 0 &&
      !is.null(model$null_index) && model$null_index != 0) {
    # Extract non-null prior weights and rescale
    pw_s <- model$pi[-model$null_index] / (1 - null_weight)
  } else {
    pw_s <- model$pi
  }
  return(pw_s)
}

# Reconstruct full prior weights with null weight handling
#' @keywords internal
reconstruct_full_weights <- function(non_null_weights, null_weight) {
  if (!is.null(null_weight) && null_weight != 0) {
    # Reconstruct full prior weights including null component
    full_weights <- c(non_null_weights * (1 - null_weight), null_weight)
  } else {
    full_weights <- non_null_weights
  }
  # Normalize to sum to 1
  return(full_weights / sum(full_weights))
}

# Validate and Override Parameters
#' @keywords internal
validate_and_override_params <- function(params) {
  # Validate prior tolerance threshold
  if (!is.numeric(params$prior_tol) || length(params$prior_tol) != 1) {
    stop("prior_tol must be a numeric scalar.")
  }
  if (params$prior_tol < 0) {
    stop("prior_tol must be non-negative.")
  }
  # Validate greedy-L parameters.
  if (!is.null(params$L_greedy)) {
    if (!is.numeric(params$L_greedy) || length(params$L_greedy) != 1 ||
        is.na(params$L_greedy) || !is.finite(params$L_greedy) ||
        params$L_greedy < 1 ||
        params$L_greedy != as.integer(params$L_greedy)) {
      stop("L_greedy must be NULL or a positive integer.")
    }
    params$L_greedy <- as.integer(params$L_greedy)
    if (params$L_greedy > params$L) {
      warning_message("L_greedy is greater than L; using L instead.")
      params$L_greedy <- as.integer(params$L)
    }
  }
  if (!is.numeric(params$greedy_lbf_cutoff) ||
      length(params$greedy_lbf_cutoff) != 1 ||
      is.na(params$greedy_lbf_cutoff) ||
      !is.finite(params$greedy_lbf_cutoff)) {
    stop("greedy_lbf_cutoff must be a numeric scalar.")
  }
  # Validate residual_variance_upperbound
  if (!is.numeric(params$residual_variance_upperbound) ||
      length(params$residual_variance_upperbound) != 1) {
    stop("residual_variance_upperbound must be a numeric scalar.")
  }
  if (params$residual_variance_upperbound <= 0) {
    stop("residual_variance_upperbound must be positive.")
  }
  # Validate scaled prior variance
  if (!is.numeric(params$scaled_prior_variance) ||
      any(params$scaled_prior_variance < 0)) {
    stop("Scaled prior variance should be positive number.")
  }
  spv_len <- length(params$scaled_prior_variance)
  if (spv_len != 1 && spv_len != params$L) {
    stop("scaled_prior_variance must be a scalar or a vector of length L.")
  }
  # Validate unmappable_effects
  # "ash_filter_archived" is a hidden option for internal diagnostics/archiving
  # of the original SuSiE-ASH filter-based masking heuristic.
  valid_unmappable <- c("none", "inf", "ash", "ash_filter_archived")
  if (!params$unmappable_effects %in% valid_unmappable) {
    stop("unmappable_effects must be one of 'none', 'inf', or 'ash'.")
  }
  # Auto-create Beta-Binomial slot prior for ash mode (identifiability).
  if (params$unmappable_effects == "ash" && is.null(params$slot_prior)) {
    params$slot_prior <- slot_prior_betabinom()
    warning_message(
      "For SuSiE-ash it is strongly advised to set slot_prior with ",
      "a beta-binomial prior based on your expected sparsity of data. ",
      "Set slot_prior = slot_prior_betabinom(a_beta, b_beta) explicitly.")
  }
  # Report BB default parameters (separate from the warning above).
  if (!is.null(params$slot_prior) &&
      inherits(params$slot_prior, "slot_prior_betabinom") &&
      isTRUE(params$slot_prior$ab_was_default)) {
    sp <- params$slot_prior
    n_active <- round(sp$a_beta / (sp$a_beta + sp$b_beta) * params$L)
    warning_message(
      "Beta-Binomial prior parameters not specified, using default ",
      "Beta(a=", sp$a_beta, ", b=", sp$b_beta, "), ",
      "roughly expecting ~", n_active, " of ", params$L,
      " slots to be active. Set a_beta and b_beta explicitly ",
      "to change this behavior.")
  }
  # Report nu default after the C message so the user sees C first.
  if (!is.null(params$slot_prior) &&
      !inherits(params$slot_prior, "slot_prior_betabinom") &&
      isTRUE(params$slot_prior$nu_was_default)) {
    sp <- params$slot_prior
    sd_mu <- sp$C / sqrt(sp$nu)
    warning_message(
      "Overdispersion parameter nu not specified, using default nu = ",
      sp$nu, ". With C = ", sp$C, " this implies sd(mu) = ",
      round(sd_mu, 2), ", so the number of active effects ranges roughly from ",
      round(max(0, sp$C - 2 * sd_mu), 1), " to ",
      round(sp$C + 2 * sd_mu, 1),
      " around the prior mean. Set nu explicitly to change this behavior.")
  }
  # Override convergence method for unmappable effects or slot_prior.
  # The ELBO is not well-defined when slot_weights != 1 (c_hat active)
  # or when unmappable effects modify the residual structure.
  needs_pip <- params$unmappable_effects != "none" || !is.null(params$slot_prior)
  if (needs_pip && params$convergence_method != "pip") {
    if (params$unmappable_effects != "none") {
      warning_message("Unmappable effects models (inf/ash) do not have a well ",
                      "defined ELBO and require PIP convergence. ",
                      "Setting convergence_method='pip'.")
    } else {
      warning_message("Slot activity model modifies fitted values ",
                      "by slot weights, making the standard ELBO invalid. ",
                      "Setting convergence_method='pip'.")
    }
    params$convergence_method <- "pip"
  }
  # Check for incompatible parameter combinations
  if (!is.null(params$refine) && params$refine &&
      params$unmappable_effects != "none") {
    stop("Refinement is not supported with unmappable effects (inf/ash) as it relies on ELBO, ",
         "which is not well-defined for these models. Please set refine = FALSE.")
  }
  # Override prior estimation method when estimation is disabled,
  # unless using a fixed mixture prior (which does not estimate V but
  # still needs the mixture BF computation path)
  if (!params$estimate_prior_variance &&
      params$estimate_prior_method != "fixed_mixture") {
    params$estimate_prior_method <- "none"
  }
  # Handle NIG parameters for small sample correction
  if (params$estimate_residual_method == "NIG") {
    params$use_NIG <- TRUE
    # Require a valid sample size n. The default alpha0/beta0 scale as
    # 1/sqrt(n), so n must be a positive finite scalar. susie() infers
    # this from nrow(X); susie_ss()'s constructor enforces it; susie_rss()
    # allows n = NULL by default, so users who select NIG must also
    # supply `n` explicitly.
    if (is.null(params$n) || !is.numeric(params$n) || length(params$n) != 1 ||
        !is.finite(params$n) || params$n < 1) {
      stop("estimate_residual_method = \"NIG\" requires a valid sample ",
           "size `n` (got n = ", paste(params$n, collapse = ""), "). ",
           "susie() infers n from nrow(X); for susie_ss() and susie_rss(), ",
           "pass `n` explicitly.")
    }
    # Validate NIG prior parameters: both must be strictly positive for a proper
    # Inverse-Gamma prior. Otherwise compute_null_loglik_NIG() evaluates
    # lgamma(alpha0 / 2) at <= 0 and the marginal log-likelihood (and ELBO)
    # become Inf or NaN.
    if (!is.numeric(params$alpha0) || length(params$alpha0) != 1 ||
        !is.finite(params$alpha0) || params$alpha0 <= 0 ||
        !is.numeric(params$beta0) || length(params$beta0) != 1 ||
        !is.finite(params$beta0) || params$beta0 <= 0) {
      stop("estimate_residual_method = \"NIG\" requires ",
           "alpha0 > 0 and beta0 > 0 (proper Inverse-Gamma prior). ",
           "Got alpha0 = ", params$alpha0, ", beta0 = ", params$beta0, ". ",
           "The default is alpha0 = beta0 = 1/sqrt(n).")
    }
    # The NIG prior inherently estimates residual variance (integrates out sigma^2).
    # If estimate_residual_variance is FALSE, override it -- the user chose a method
    # that estimates sigma^2 by design. To suppress this warning, explicitly set
    # estimate_residual_variance = TRUE in the function call.
    if (!isTRUE(params$estimate_residual_variance)) {
      warning_message("NIG prior integrates out residual variance, ",
                      "implying estimate_residual_variance = TRUE. ",
                      "Setting estimate_residual_variance = TRUE. ",
                      "To suppress this warning, explicitly set ",
                      "estimate_residual_variance = TRUE in the function call.")
      params$estimate_residual_variance <- TRUE
    }
    # Override convergence method only when L > 1
    if (params$L > 1 && params$convergence_method != "pip") {
      warning_message("NIG method with L > 1 requires PIP convergence. Setting convergence_method='pip'.")
      params$convergence_method <- "pip"
    }
    # Override prior variance estimation method (only when estimation is enabled)
    if (params$estimate_prior_variance && params$estimate_prior_method != "EM") {
      warning_message("NIG method works better with EM. Setting estimate_prior_method='EM'.")
      params$estimate_prior_method <- "EM"
    }
  } else {
    params$use_NIG <- FALSE
    params$alpha0 <- NULL
    params$beta0 <- NULL
  }
  return(params)
}

# =============================================================================
# MODEL INITIALIZATION
#
# Functions that set up initial model states, create model matrices,
# and handle model configuration. These prepare the SuSiE model object
# for iterative fitting.
#
# Functions: initialize_null_index, assign_names,
# adjust_L, prune_single_effects, add_null_effect
# =============================================================================

# Initialize Null Index
#' @keywords internal
initialize_null_index <- function(data, model) {
  # When a null weight is in play, the null (dummy) variable is the last
  # column; otherwise 0 flags "no null variable".
  if (is.null(model$null_weight) || model$null_weight == 0) {
    null_idx <- 0
  } else {
    null_idx <- data$p
  }
  return(null_idx)
}

# Helper function to assign variable names to model components
#' @keywords internal
assign_names <- function(data, model, variable_names) {
  if (!is.null(variable_names)) {
    if (!is.null(model$null_weight) && model$null_weight != 0 &&
        !is.null(model$null_index) && model$null_index != 0) {
      # Last column is the null variable; it is excluded from the PIP names.
      variable_names[length(variable_names)] <- "null"
      names(model$pip) <- variable_names[-data$p]
    } else {
      names(model$pip) <- variable_names
    }
    colnames(model$alpha) <- variable_names
    colnames(model$mu) <- variable_names
    colnames(model$mu2) <- variable_names
    colnames(model$lbf_variable) <- variable_names
  }
  return(model)
}

# Expand scaled_prior_variance into a length-L vector of prior variances.
# Accepts either a scalar (recycled to length L) or a length-L vector
# (used as-is, one prior variance per single-effect slot).
#' @keywords internal
expand_scaled_prior_variance <- function(scaled_prior_variance, var_y, L) {
  # A scalar is recycled to length L; a vector is used per slot. Either way
  # the result is on the variance-of-y scale.
  if (length(scaled_prior_variance) == 1) {
    rep(scaled_prior_variance * var_y, L)
  } else {
    scaled_prior_variance * var_y
  }
}

# Adjust the number of effects
#' @keywords internal
adjust_L <- function(params, model_init_pruned, var_y) {
  num_effects <- nrow(model_init_pruned$alpha)
  L <- params$L
  if (num_effects > L) {
    # Never drop effects supplied via model_init; grow L to fit them.
    warning_message(paste0(
      "Requested L = ", L, " is smaller than the ", num_effects,
      " effects in model_init after pruning; ",
      "using L = ", num_effects, " instead."
    ))
    L <- num_effects
  }
  V <- expand_scaled_prior_variance(params$scaled_prior_variance, var_y, L)
  model_init <- prune_single_effects(model_init_pruned, L = L, V = V)
  return(list(model_init = model_init, L = L))
}

# Prune single effects to given number L in susie model object.
#' @keywords internal
prune_single_effects <- function(model_init, L = 0, V = NULL) {
  num_effects <- nrow(model_init$alpha)
  if (L == 0) {
    # Filtering will be based on non-zero elements in model_init$V.
    if (!is.null(model_init$V)) {
      L <- length(which(model_init$V > 0))
    } else {
      L <- num_effects
    }
  }
  if (L == num_effects) {
    model_init$sets <- NULL
    return(model_init)
  }
  # Rank effects so those already in credible sets come first.
  if (!is.null(model_init$sets$cs_index)) {
    effects_rank <- c(model_init$sets$cs_index,
                      setdiff(1:num_effects, model_init$sets$cs_index))
  } else {
    effects_rank <- 1:num_effects
  }
  # NOTE(review): only expansion (L > num_effects) modifies the model below;
  # shrinking to a smaller L is not implemented here -- presumably callers
  # such as adjust_L() always pass L >= num_effects. Confirm before relying
  # on this for L < num_effects.
  if (L > num_effects) {
    message(paste(
      "Specified number of effects L =", L,
      "is greater the number of effects", num_effects,
      "in input SuSiE model. The SuSiE model will be expanded",
      "to have", L, "effects."
    ))
    # New slots get a flat alpha row and zero means / log-BFs.
    model_init$alpha <- rbind(
      model_init$alpha[effects_rank, ],
      matrix(1 / ncol(model_init$alpha), L - num_effects,
             ncol(model_init$alpha))
    )
    for (n in c("mu", "mu2", "lbf_variable")) {
      if (!is.null(model_init[[n]])) {
        model_init[[n]] <- rbind(
          model_init[[n]][effects_rank, ],
          matrix(0, L - num_effects, ncol(model_init[[n]]))
        )
      }
    }
    for (n in c("KL", "lbf")) {
      if (!is.null(model_init[[n]])) {
        model_init[[n]] <- c(model_init[[n]][effects_rank],
                             rep(NA, L - num_effects))
      }
    }
    if (!is.null(V)) {
      if (length(V) > 1) {
        # Preserve the existing per-effect prior variances for old slots.
        if (!is.null(model_init$V)) {
          V[1:num_effects] <- model_init$V[effects_rank]
        }
      } else {
        V <- rep(V, L)
      }
    }
    model_init$V <- V
  }
  model_init$sets <- NULL
  return(model_init)
}

# Add a null effect to the model object
#' @keywords internal
add_null_effect <- function(model_init, V) {
  # Appends one extra single-effect slot with a flat alpha row, zero
  # means/log-BFs, and prior variance V.
  p <- ncol(model_init$alpha)
  model_init$alpha <- rbind(model_init$alpha, 1 / p)
  model_init$mu <- rbind(model_init$mu, rep(0, p))
  model_init$mu2 <- rbind(model_init$mu2, rep(0, p))
  model_init$lbf_variable <- rbind(model_init$lbf_variable, rep(0, p))
  model_init$V <- c(model_init$V, V)
  return(model_init)
}

# =============================================================================
# MATRIX-VECTOR PRODUCT HELPERS
#
# Unified helpers for predictor-matrix-times-vector operations across
# SS (XtX) and RSS-lambda (R) data types. These dispatch on what's available
# on the data object: data$X (low-rank factor), data$XtX, or data$R.
# When data$X is stored (Bxp, B < p), the two-step product X'(Xv) avoids
# forming the pxp matrix, reducing cost from O(p^2) to O(Bp).
#
# Functions: compute_Rv, compute_BR
# =============================================================================

# Compute R*v product: X'(Xv), XtX*v, or R*v.
# For multi-panel rss_lambda, pass Rv_matrix = model$X_meta to use the
# current R(omega) factor instead of data$X.
#' @keywords internal
compute_Rv <- function(data, v, Rv_matrix = NULL) {
  # Dispatch in priority order: explicit factor override, low-rank factor,
  # precomputed XtX, then raw LD matrix R. Guard-clause returns replace the
  # original else-if chain.
  if (!is.null(Rv_matrix))
    return(as.vector(crossprod(Rv_matrix, Rv_matrix %*% v)))
  if (!is.null(data$X))
    return(as.vector(crossprod(data$X, data$X %*% v)))
  if (!is.null(data$XtX))
    return(as.vector(data$XtX %*% v))
  if (!is.null(data$R))
    return(as.vector(data$R %*% v))
  stop("No predictor matrix available on data object.")
}

# Compute B_mat %*% predictor-matrix: (Lxp) times (pxp) -> (Lxp)
# Used in get_ER2.ss for the quadratic form B %*% XtX
#' @keywords internal
compute_BR <- function(data, B_mat) {
  if (!is.null(data$X)) {
    # Two-step product avoids materializing the p x p matrix X'X.
    (B_mat %*% t(data$X)) %*% data$X
  } else if (!is.null(data$XtX)) {
    B_mat %*% data$XtX
  } else {
    stop("No predictor matrix available for compute_BR.")
  }
}

# =============================================================================
# CORE ALGORITHM COMPONENTS
#
# Key computational functions that implement the mathematical core of the
# SuSiE algorithm. These handle eigen decompositions, posterior computations,
# and log Bayes factor calculations.
#
# Functions: compute_eigen_decomposition, add_eigen_decomposition,
# compute_omega_quantities, scale_design_matrix, compute_theta_blup,
# lbf_stabilization, compute_posterior_weights, compute_lbf_gradient
# =============================================================================

# Compute eigenvalue decomposition for unmappable methods
# When X (low-rank factor) is available, uses thin SVD (O(pB^2)) instead
# of eigen decomposition of XtX (O(p^3)).
#' @keywords internal
compute_eigen_decomposition <- function(XtX, n, X = NULL) {
  if (is.null(X)) {
    # Dense path: eigen-decompose the p x p LD matrix XtX / n, then rescale
    # the eigenvalues by n (clamped at zero) and sort decreasing.
    decomp <- eigen(XtX / n, symmetric = TRUE)
    ord <- order(decomp$values, decreasing = TRUE)
    return(list(V = decomp$vectors[, ord],
                Dsq = pmax(decomp$values[ord] * n, 0),
                VtXty = NULL))
  }
  # Low-rank path: thin SVD of the B x p factor X; squared singular values
  # are the eigenvalues of X'X.
  p <- ncol(X)
  decomp <- svd(X, nu = 0)
  vecs <- decomp$v
  evals <- pmax(decomp$d^2, 0)
  if (ncol(vecs) < p) {
    # Pad the null space with zero eigenvectors and zero eigenvalues.
    vecs <- cbind(vecs, matrix(0, p, p - ncol(vecs)))
    evals <- c(evals, rep(0, p - length(evals)))
  }
  ord <- order(evals, decreasing = TRUE)
  list(V = vecs[, ord], Dsq = evals[ord], VtXty = NULL)
}

# Add eigen decomposition to ss data objects for unmappable methods
#' @keywords internal
add_eigen_decomposition <- function(data, params, individual_data = NULL) {
  # Compute the decomposition (thin SVD when a low-rank X is available) and
  # attach its pieces, plus V'X'y, to the data object.
  decomp <- compute_eigen_decomposition(data$XtX, data$n, X = data$X)
  data$eigen_vectors <- decomp$V
  data$eigen_values <- decomp$Dsq
  data$VtXty <- t(decomp$V) %*% data$Xty
  return(data)
}

#' Scale design matrix using centering and scaling parameters
#'
#' Applies column-wise centering and scaling to match the space used by
#' compute_XtX() and compute_Xty() for unmappable effects methods
#'
#' @param X Matrix to scale (n x p)
#' @param center Vector of column means to subtract (length p), or NULL
#' @param scale Vector of column SDs to divide by (length p), or NULL
#'
#' @return Scaled matrix with centered and scaled columns
#'
#' @keywords internal
scale_design_matrix <- function(X, center = NULL, scale = NULL) {
  p <- ncol(X)
  # NULL means "no-op": subtract zeros / divide by ones.
  if (is.null(center)) center <- rep(0, p)
  if (is.null(scale)) scale <- rep(1, p)
  sweep(sweep(X, 2, center, "-"), 2, scale, "/")
}

# Compute Omega-weighted quantities for unmappable effects methods
#' @keywords internal
compute_omega_quantities <- function(data, tau2, sigma2) {
  # Per-eigencomponent variance tau2 * d_k + sigma2, and the diagonal of
  # X' Omega X expressed through the eigen decomposition.
  omega_var <- tau2 * data$eigen_values + sigma2
  ratios <- data$eigen_values / omega_var
  list(
    omega_var = omega_var,
    diagXtOmegaX = rowSums(sweep(data$eigen_vectors^2, 2, ratios, `*`))
  )
}

# Compute unmappable effects coefficient vector using BLUP
#' @keywords internal
compute_theta_blup <- function(data, model) {
  # Omega-weighted variances in eigen space.
  oq <- compute_omega_quantities(data, model$tau2, model$sigma2)
  # Posterior-mean effect vector collapsed over the L slots.
  b_bar <- colSums(model$mu * model$alpha)
  # X'Omega(y - Xb), assembled in the eigenbasis.
  Vt_b <- t(data$eigen_vectors) %*% b_bar
  XtOmegaXb <- data$eigen_vectors %*% (Vt_b * data$eigen_values / oq$omega_var)
  XtOmegay <- data$eigen_vectors %*% (data$VtXty / oq$omega_var)
  # BLUP: theta = tau2 * X'Omega r.
  model$tau2 * (XtOmegay - XtOmegaXb)
}

# Stabilize log Bayes factors and compute log posterior odds
#' @keywords internal
lbf_stabilization <- function(lbf, prior_weights, shat2) {
  eps <- sqrt(.Machine$double.eps)
  lpo <- lbf + log(prior_weights + eps)
  # When shat2 is infinite, set lbf=0 and lpo to prior (no information from data)
  no_info <- is.infinite(shat2)
  lbf[no_info] <- 0
  lpo[no_info] <- log(prior_weights[no_info] + eps)
  list(lbf = lbf, lpo = lpo)
}

# Compute alpha and lbf for each effect
#' @keywords internal
compute_posterior_weights <- function(lpo) {
  # Log-sum-exp with the max subtracted for numerical stability.
  shift <- max(lpo)
  w <- exp(lpo - shift)
  total <- sum(w)
  list(alpha = w / total, lbf_model = log(total) + shift)
}

# Compute gradient for prior variance optimization
#' @keywords internal
compute_lbf_gradient <- function(alpha, betahat, shat2, V, use_NIG = FALSE) {
  # No gradient computation for NIG prior
  if (use_NIG)
    return(NULL)
  z2 <- betahat^2 / shat2
  per_var <- 0.5 * (1 / (V + shat2)) * ((shat2 / (V + shat2)) * z2 - 1)
  # 0/0 cases (e.g. shat2 = Inf) contribute nothing.
  per_var[is.nan(per_var)] <- 0
  sum(alpha * per_var)
}

# =============================================================================
# VARIANCE ESTIMATION
#
# Functions specifically for estimating variance components using different
# methods (MLE, MoM, NIG). These handle both standard SuSiE
# and unmappable effects models.
#
# Functions: mom_unmappable, mle_unmappable, create_ash_grid,
#            compute_lbf_NIG_univariate, posterior_mean_NIG,
#            posterior_var_NIG, compute_stats_NIG, update_prior_variance_NIG_EM,
#            compute_kl_NIG, inv_gamma_factor, compute_null_loglik_NIG,
#            compute_marginal_loglik, est_residual_variance, update_model_variance
# =============================================================================

# Method of Moments variance estimation for unmappable effects methods.
#
# Solves the 2x2 moment system A %*% c(sigma2, tau2) = x, where A is built
# from the eigenvalues of the design and x from residual sums of squares.
# If the joint solution is not positive, falls back to tau2 = 0 with
# sigma2 = x[1] / n.
#
# NOTE(review): if both est_tau2 and est_sigma2 are FALSE, sigma2 is never
# assigned and the final return() errors — confirm callers always set at
# least one of the two flags.
#' @keywords internal
mom_unmappable <- function(data, params, model, omega, tau2,
                           est_tau2 = TRUE, est_sigma2 = TRUE) {
  L <- nrow(model$mu)
  A <- matrix(0, nrow = 2, ncol = 2)
  A[1, 1] <- data$n
  A[1, 2] <- sum(data$eigen_values)
  A[2, 1] <- A[1, 2]
  A[2, 2] <- sum(data$eigen_values^2)
  # Compute diag(V'MV), the second moment of the fitted sparse effects in
  # the eigen basis: starts from (V'b)^2, removes per-effect squares, and
  # adds back per-effect posterior second moments.
  b <- colSums(model$mu * model$alpha)
  Vtb <- crossprod(data$eigen_vectors, b)
  diagVtMV <- Vtb^2
  tmpD <- rep(0, data$p)
  for (l in seq_len(L)) {
    bl <- model$mu[l, ] * model$alpha[l, ]
    Vtbl <- crossprod(data$eigen_vectors, bl)
    diagVtMV <- diagVtMV - Vtbl^2
    tmpD <- tmpD + model$alpha[l, ] * (model$mu[l, ]^2 + 1 / omega[l, ])
  }
  diagVtMV <- diagVtMV + rowSums(sweep(t(data$eigen_vectors)^2, 2, tmpD, `*`))
  # Compute x: the two empirical moments matched against A.
  x <- rep(0, 2)
  x[1] <- data$yty - 2 * sum(b * data$Xty) + sum(data$eigen_values * diagVtMV)
  x[2] <- sum(data$Xty^2) - 2 * sum(Vtb * data$VtXty * data$eigen_values) +
    sum(data$eigen_values^2 * diagVtMV)
  if (est_tau2) {
    sol <- solve(A, x)
    if (sol[1] > 0 && sol[2] > 0) {
      sigma2 <- sol[1]
      tau2 <- sol[2]
    } else {
      # Non-positive joint solution: fall back to no random effect.
      sigma2 <- x[1] / data$n
      tau2 <- 0
    }
    if (params$verbose) {
      message(sprintf("Update (sigma^2,tau^2) to (%f,%e)\n", sigma2, tau2))
    }
  } else if (est_sigma2) {
    # tau2 is fixed at its input value; solve the first moment equation only.
    sigma2 <- (x[1] - A[1, 2] * tau2) / data$n
    if (params$verbose) {
      message(sprintf("Update sigma^2 to %f\n", sigma2))
    }
  }
  return(list(sigma2 = sigma2, tau2 = tau2))
}

# MLE variance estimation for unmappable effects.
#
# Minimizes the negative ELBO over (sigma^2, tau^2) (or sigma^2 alone when
# est_tau2 is FALSE) with box-constrained L-BFGS-B. On optimizer failure the
# previous parameter values are kept and a warning is emitted.
#' @keywords internal
mle_unmappable <- function(data, params, model, omega,
                           est_tau2 = TRUE, est_sigma2 = TRUE) {
  L <- nrow(model$alpha)
  # Set default ranges for the box constraints, scaled by the data variance.
  sigma2_range <- c(0.2 * data$yty / data$n, 1.2 * data$yty / data$n)
  tau2_range <- c(1e-12, 1.2 * data$yty / (data$n * data$p))
  # Compute diag(V'MV) (same construction as in mom_unmappable).
  b <- colSums(model$mu * model$alpha)
  Vtb <- crossprod(data$eigen_vectors, b)
  diagVtMV <- Vtb^2
  tmpD <- rep(0, data$p)
  for (l in seq_len(L)) {
    bl <- model$mu[l, ] * model$alpha[l, ]
    Vtbl <- crossprod(data$eigen_vectors, bl)
    diagVtMV <- diagVtMV - Vtbl^2
    tmpD <- tmpD + model$alpha[l, ] * (model$mu[l, ]^2 + 1 / omega[l, ])
  }
  diagVtMV <- diagVtMV + rowSums(sweep(t(data$eigen_vectors)^2, 2, tmpD, `*`))
  # Negative ELBO as a function of x = (sigma^2, tau^2).
  f <- function(x) {
    sigma2_val <- x[1]
    tau2_val <- x[2]
    var_val <- tau2_val * data$eigen_values + sigma2_val
    0.5 * (data$n - data$p) * log(sigma2_val) + 0.5 / sigma2_val * data$yty +
      sum(0.5 * log(var_val) -
          0.5 * tau2_val / sigma2_val * data$VtXty^2 / var_val -
          Vtb * data$VtXty / var_val +
          0.5 * data$eigen_values / var_val * diagVtMV)
  }
  # Negative ELBO for sigma^2 only (when tau^2 is fixed).
  g <- function(sigma2_val) {
    f(c(sigma2_val, model$tau2))
  }
  # Initialize with current values so a failed optimization is a no-op.
  sigma2 <- model$sigma2
  tau2 <- model$tau2
  if (est_tau2) {
    # Optimize both sigma^2 and tau^2.
    res <- optim(
      par = c(model$sigma2, model$tau2),
      fn = f,
      method = "L-BFGS-B",
      lower = c(sigma2_range[1], tau2_range[1]),
      upper = c(sigma2_range[2], tau2_range[2])
    )
    if (res$convergence == 0) {
      sigma2 <- res$par[1]
      tau2 <- res$par[2]
      if (params$verbose) {
        message(sprintf("Update (sigma^2,tau^2) to (%f,%e)\n", sigma2, tau2))
      }
    } else {
      warning_message("MLE optimization failed to converge; keeping previous parameters")
    }
  } else if (est_sigma2) {
    # Optimize only sigma^2.
    res <- optim(
      par = model$sigma2,
      fn = g,
      method = "L-BFGS-B",
      lower = sigma2_range[1],
      upper = sigma2_range[2]
    )
    if (res$convergence == 0) {
      sigma2 <- res$par
      if (params$verbose) {
        message(sprintf("Update sigma^2 to %f\n", sigma2))
      }
    } else {
      warning_message("MLE optimization failed to converge; keeping previous parameters")
    }
  }
  return(list(sigma2 = sigma2, tau2 = tau2))
}

# Extract NIG sufficient statistics from model, regardless of data type.
# This is the ONLY function that needs to know whether we have individual or
# SS data. All other NIG functions work with (yy, sxy, tau) uniformly.
#' @keywords internal
get_nig_sufficient_stats <- function(data, model) {
  if (!is.null(model$raw_residuals)) {
    # Individual data path: compute from raw residuals.
    yy <- sum(model$raw_residuals^2)
    sxy <- drop(cor(data$X, model$raw_residuals))
    tau <- 1
  } else {
    # SS/RSS path: use pre-computed quantities.
    yy <- model$yy_residual
    sxy <- model$residuals / sqrt(model$predictor_weights * yy)
    # Clamp sxy to [-1, 1]: with approximate R from a finite reference,
    # Cauchy-Schwarz may be violated numerically, giving |sxy| > 1.
    # This would make rss = yy*(1 - r0*sxy^2) negative, producing NaN in log BF.
    sxy <- pmin(pmax(sxy, -1), 1)
    tau <- if (!is.null(model$shat2_inflation)) model$shat2_inflation else 1
  }
  list(yy = yy, sxy = sxy, tau = tau)
}

# Inputs for compute_kl_NIG: single-IG projection of the SER posterior.
# a_post = (alpha0+n)/2; b_post = (beta0 + sum_j alpha_j RSS_j)/2 with
# RSS_j = yy*(1 - r0_j*sxy_j^2); s_j_sq = r0_j * tau / xx_j.
#' @keywords internal
nig_kl_inputs <- function(data, params, model, l) {
  ss <- get_nig_sufficient_stats(data, model)
  xx <- model$predictor_weights
  # Shrinkage factor r0_j for effect l at each predictor.
  shrink <- model$V[l] / (model$V[l] + ss$tau / xx)
  a_l <- model$alpha[l, ]
  # Residual sum of squares averaged over the posterior assignment q(gamma).
  rss_bar <- ss$yy * (1 - sum(a_l * shrink * ss$sxy^2))
  list(
    a_post = (params$alpha0 + data$n) / 2,
    b_post = (params$beta0 + rss_bar) / 2,
    s_j_sq = shrink * ss$tau / xx
  )
}

# Compute log Bayes factor for NIG prior (univariate form on raw x, y).
#' @keywords internal
compute_lbf_NIG_univariate <- function(x, y, s0, alpha0 = 0, beta0 = 0) {
  xc <- x - mean(x)
  yc <- y - mean(y)
  n <- length(xc)
  xx <- sum(xc * xc)
  yy <- sum(yc * yc)
  shrink <- s0 / (s0 + 1 / xx)
  rho <- sum(xc * yc) / sqrt(xx * yy)
  # Ratio of posterior to prior inverse-gamma scale parameters.
  ratio <- (beta0 + yy * (1 - shrink * rho^2)) / (beta0 + yy)
  (log(1 - shrink) - (n + alpha0) * log(ratio)) / 2
}

# Posterior mean for NIG prior using sufficient statistics.
#' @keywords internal
posterior_mean_NIG <- function(xtx, xty, s0_t = 1) {
  prec <- xtx + 1 / s0_t^2
  (1 / prec) %*% xty
}

# Posterior variance for NIG prior using sufficient statistics.
#' @keywords internal
posterior_var_NIG <- function(xtx, xty, yty, n, s0_t = 1) {
  # A vanishingly small prior variance pins the effect at zero.
  if (s0_t < 1e-5)
    return(list(post_var = 0, beta1 = 0))
  omega <- 1 / (xtx + 1 / s0_t^2)
  b_bar <- omega %*% xty
  # Residual sum of squares after removing the posterior-mean fit.
  sse <- yty - b_bar * (1 / omega) * b_bar
  numer <- 0.5 * sse
  denom <- 0.5 * (n * (1 / omega))
  list(post_var = omega * (numer / denom) * n / (n - 2), beta1 = sse)
}

# Compute the (log) Bayes factors and additional statistics under
# Normal-Inverse-Gamma (NIG) prior.
#' @keywords internal
compute_stats_NIG <- function(n, xx, xy, yy, sxy, s0, a0, b0, tau = 1) {
  shrink <- s0 / (s0 + tau / xx)
  rss <- yy * (1 - shrink * sxy^2)
  # Updated inverse-gamma parameters.
  a1 <- a0 + n
  b1 <- b0 + rss
  # Log Bayes factor for each variable.
  lbf <- -(log(1 + s0 * xx / tau) + a1 * log(b1 / (b0 + yy))) / 2
  # Shrink the least-squares estimate toward zero.
  pm <- shrink * (xy / xx)
  pv <- b1 / (a1 - 2) * shrink * tau / xx
  list(
    lbf = lbf,
    post_mean = pm,
    post_mean2 = pv + pm^2,
    post_var = pv,
    # Posterior mean of residual variance under IG((a0+n)/2, (b0+RSS)/2).
    rv = (b1 / 2) / (a1 / 2 - 1)
  )
}

# Compute log Bayes factors under Normal-Inverse-Gamma (NIG) prior.
#' @keywords internal
compute_lbf_NIG <- function(n, xx, xy, yy, sxy, s0, a0, b0, tau = 1) {
  shrink <- s0 / (s0 + tau / xx)
  rss <- yy * (1 - shrink * sxy^2)
  # Updated inverse-gamma parameters.
  a1 <- a0 + n
  b1 <- b0 + rss
  -(log(1 + s0 * xx / tau) + a1 * log(b1 / (b0 + yy))) / 2
}

# Compute posterior moments under Normal-Inverse-Gamma (NIG) prior.
#' @keywords internal
compute_posterior_moments_NIG <- function(n, xx, xy, yy, sxy, s0, a0, b0, tau = 1) {
  shrink <- s0 / (s0 + tau / xx)
  rss <- yy * (1 - shrink * sxy^2)
  # Updated inverse-gamma parameters.
  a1 <- a0 + n
  b1 <- b0 + rss
  # Shrunken least-squares estimate and its posterior variance.
  pm <- shrink * (xy / xx)
  pv <- b1 / (a1 - 2) * shrink * tau / xx
  list(
    post_mean = pm,
    post_mean2 = pv + pm^2,
    post_var = pv,
    s_j_sq = shrink * tau / xx,
    # Posterior mean of residual variance under IG((a0+n)/2, (b0+RSS)/2).
    rv = (b1 / 2) / (a1 / 2 - 1)
  )
}

# EM update for prior variance under Normal-Inverse-Gamma (NIG) prior.
#' @keywords internal
update_prior_variance_NIG_EM <- function(n, xx, xy, yy, sxy, pip, s0, a0, b0, tau = 1) {
  shrink <- s0 / (s0 + tau / xx)
  rss <- yy * (1 - shrink * sxy^2)
  # Updated inverse-gamma parameters.
  a1 <- a0 + n
  b1 <- b0 + rss
  pm <- shrink * (xy / xx)
  pv <- shrink * tau / xx
  # Moments of b under its marginal (scaled-t) posterior.
  u <- gamma(1/2) / beta(a1/2, 1/2)
  mb <- pm * sqrt(2 / b1) * u
  vb <- pv + pm^2 * 2 / b1 * (1 / beta(a1/2, 1) - u^2)
  sum(pip * (vb + mb^2))
}

# KL divergence for the NIG variational form. KL_beta uses the Gaussian-
# Gaussian KL with shared sigma^2 scaling (sigma^2 log-dets cancel; only
# mu^2/(sigma^2 V) survives). KL_sigma2 is the closed form for IG||IG.
#' @keywords internal
compute_kl_NIG <- function(alpha, post_mean, post_mean2, pi, V, a0, b0,
                           a_post, b_post, s_j_sq) {
  tiny <- .Machine$double.eps
  # KL for the categorical assignment q(gamma) || p(gamma), guarded
  # against log(0).
  kl_gamma <- sum(alpha * (log(pmax(alpha, tiny)) - log(pmax(pi, tiny))))
  # KL for b given sigma^2, integrated over q(sigma^2);
  # E[1/sigma^2] under IG(a_post, b_post) is a_post / b_post.
  e_prec <- a_post / b_post
  kl_beta <- 0.5 * sum(alpha * (
    log(V) - log(pmax(s_j_sq, tiny)) + s_j_sq / V +
      post_mean^2 * e_prec / V - 1
  ))
  # KL between the IG posterior and the IG prior (closed form).
  kl_sigma2 <- lgamma(a0) - lgamma(a_post) + a0 * log(b_post / b0) +
    (a_post - a0) * digamma(a_post) - a_post + (a_post * b0) / b_post
  as.numeric(kl_gamma + kl_beta + kl_sigma2)
}

# Compute log-normalizing factor for the IG(a,b) distribution.
#' @keywords internal
inv_gamma_factor <- function(a, b) {
  a * log(b) - lgamma(a)
}

# Compute null log-likelihood under NIG prior.
#' @keywords internal
compute_null_loglik_NIG <- function(n, yy, a0, b0, use_NIG = FALSE) {
  # Only defined for the NIG prior.
  if (!use_NIG)
    return(NULL)
  -n * log(2 * pi) / 2 +
    inv_gamma_factor(a0 / 2, b0 / 2) -
    inv_gamma_factor((a0 + n) / 2, (b0 + yy) / 2)
}

# Compute marginal log-likelihood for single effect regression.
#' @keywords internal
compute_marginal_loglik <- function(lbf_model, n, yy, a0, b0, use_NIG = FALSE) {
  # Only defined for the NIG prior.
  if (!use_NIG)
    return(NULL)
  # Marginal = model log Bayes factor plus the null log-likelihood.
  lbf_model + compute_null_loglik_NIG(n, yy, a0, b0, use_NIG = TRUE)
}

# Estimate residual variance.
#' @keywords internal
est_residual_variance <- function(data, model) {
  resid_var <- (1 / data$n) * get_ER2(data, model)
  if (resid_var < 0)
    stop("est_residual_variance() failed: the estimated value is negative")
  resid_var
}

# =============================================================================
# SuSiE-ASH SHARED UTILITIES
#
# Functions shared between individual-level and summary-statistics ash paths.
# The masking logic is data-type-agnostic (only needs correlation matrix),
# while the mr.ash fitting is dispatched to either mr.ash (individual) or
# mr.ash.rss (summary stats).
#
# Design: individual-level data uses mr.ash directly, SS data uses mr.ash.rss.
# The init/masking/cleanup logic is shared since it depends only on model
# dimensions (n, p, L), not on data representation.
# =============================================================================

# Initialize ash tracking fields on a model object
#
# Shared between individual and SS model initialization.
# Individual models store X_theta (n-vector); SS models store XtX_theta (p-vector).
#
# @param model Model object to augment
# @param n Number of observations (used only by individual path for X_theta)
# @param p Number of predictors
# @param L Number of single effects
# @param is_individual Whether this is individual-level data
#
# @return Model with ash tracking fields added
#
# @keywords internal
init_ash_fields <- function(model, n, p, L, is_individual = FALSE) {
  model$tau2 <- 0
  model$theta <- rep(0, p)
  model$ash_iter <- 0
  model$ash_pi <- NULL
  model$ash_s0 <- NULL
  # Individual-level models track fitted values X %*% theta (length n);
  # summary-statistic models track XtX %*% theta (length p) instead.
  if (is_individual)
    model$X_theta <- rep(0, n)
  else
    model$XtX_theta <- rep(0, p)
  model
}

# Same as init_ash_fields() plus the per-variant and per-effect tracking
# arrays used by the archived filter-based masking heuristic.
# @keywords internal
init_ash_fields_filter_archived <- function(model, n, p, L, is_individual = FALSE) {
  model <- init_ash_fields(model, n, p, L, is_individual)
  # Per-variant (length p) mask bookkeeping.
  model$masked <- rep(FALSE, p)
  # Per-effect (length L) classification state.
  model$diffuse_iter_count <- rep(0, L)
  model$prev_sentinel <- rep(0, L)
  # Per-variant unmask / expose / second-chance counters and flags.
  model$unmask_candidate_iters <- rep(0, p)
  model$ever_unmasked <- rep(FALSE, p)
  model$force_exposed_iter <- rep(0, p)
  model$ever_diffuse <- rep(0, L)
  model$second_chance_used <- rep(FALSE, p)
  model$prev_case <- rep(0, L)
  model
}

# Update ash variance components: coordinate SuSiE and Mr.ASH
#
# Manages the interaction between SuSiE's sparse effects (beta) and
# Mr.ASH's dense effects (theta).
# Uses three zones to prevent Mr.ASH
# from absorbing signals SuSiE is fine-mapping:
#
#   SUBTRACT: Trusted effects are fully removed from Mr.ASH residuals.
#             Mr.ASH cannot see or absorb these confirmed signals.
#   MASK:     Emerging effects have theta forced to 0 in their LD
#             neighborhoods. Mr.ASH cannot absorb signal here, giving SuSiE
#             time to resolve these effects.
#   EXPOSE:   Positions not covered by subtraction or masking. Mr.ASH
#             absorbs signal freely. LD spillover and false positives that
#             get flagged and unmasked end up here.
#
# Spillover is detected in two ways:
#   Across-SER: Two effects whose sentinels are in tight LD (|r| > 0.9)
#               are colliding on the same signal. Both get flagged.
#   Within-SER: A sentinel that jumps to a distant variant (|r| < 0.5)
#               indicates the effect is not well-localized. Gets flagged.
#
# Flagged effects are initially masked (protected). After unmask_delay
# iterations, the OLD sentinel's LD neighborhood is selectively exposed
# to Mr.ASH, allowing absorption of spillover at the confusion point
# while the effect's current position stays protected.
#
# @param data Data object (individual or SS).
# @param model Current SuSiE model.
# @param params Parameters object.
#
# @return List of updated model fields (sigma2, tau2, theta, etc.)
#   to be merged into model via modifyList.
#
# @keywords internal
## V0-faithful three-case classification for BB+ash filter
## Replaces the body of update_ash_variance_components()
## Key change: standard purity (not effect_purity) for case classification
## + force_mask for diffuse slots' sentinel LD (from V0)
update_ash_variance_components <- function(data, model, params) {
  # BB+ash filter: V0's 3-tier classifier (diffuse / uncertain / confident)
  # with c_hat marginalization of CASE 3 subtraction.
  # Output: b_confident (subtract from mr.ash residual) and mask.

  # --- User parameters ---
  purity_threshold <- if (!is.null(params$purity_threshold)) params$purity_threshold else 0.5
  pip_threshold <- if (!is.null(params$pip_threshold)) params$pip_threshold else 0.1
  ld_threshold <- if (!is.null(params$ld_threshold)) params$ld_threshold else 0.5

  # --- Internal constants ---
  diffuse_purity <- 0.1              # purity below this = CASE 1
  cs_threshold <- 0.9                # working CS coverage
  neighborhood_pip_threshold <- 0.4  # LD-spread mask threshold
  collision_threshold <- 0.9         # strong LD = same signal
  tight_ld_threshold <- 0.95         # WTE exposure region
  diffuse_iter_count <- 2L           # CASE 2 stable iters before WTE
  second_chance_wait <- 3L           # iters after expose before re-mask
  delayed_unmask_iter <- 2L          # iters unwanted before unmask

  is_individual <- inherits(data, "individual")
  L <- nrow(model$alpha)
  p <- ncol(model$alpha)
  if (is.null(model$ash_iter)) model$ash_iter <- 0L
  model$ash_iter <- model$ash_iter + 1L

  # Lazy-init state (first call on a model that was not pre-initialized).
  if (is.null(model$prev_case)) model$prev_case <- rep(0L, L)
  if (is.null(model$prev_sentinel)) model$prev_sentinel <- rep(0L, L)
  if (is.null(model$ever_diffuse)) model$ever_diffuse <- rep(0L, L)
  if (is.null(model$diffuse_iter_count)) model$diffuse_iter_count <- rep(0L, L)
  if (is.null(model$masked)) model$masked <- rep(FALSE, p)
  if (is.null(model$ever_unmasked)) model$ever_unmasked <- rep(FALSE, p)
  if (is.null(model$unmask_candidate_iters)) model$unmask_candidate_iters <- rep(0L, p)
  if (is.null(model$force_exposed_iter)) model$force_exposed_iter <- rep(0L, p)
  if (is.null(model$second_chance_used)) model$second_chance_used <- rep(FALSE, p)

  # Correlation matrix (cached on the data object after first call).
  xcorr_result <- get_xcorr(data)
  Xcorr <- xcorr_result$Xcorr
  data <- xcorr_result$data

  # c_hat = BB posterior slot-active weight (fallback 1 = V0).
  c_hat <- if (!is.null(model$slot_weights)) model$slot_weights else rep(1, L)

  # First pass: sentinels, purity, activity
  sentinels <- apply(model$alpha, 1, which.max)
  effect_purity <- rep(1.0, L)
  is_active <- rep(FALSE, L)
  for (l in 1:L) {
    a <- model$alpha[l, ]
    # A slot with (numerically) uniform alpha is considered inactive.
    is_active[l] <- (max(a) - min(a)) >= 5e-5
    alpha_order <- order(a, decreasing = TRUE)
    # Size of the working credible set at cs_threshold coverage.
    cs_size <- min(sum(cumsum(a[alpha_order]) <= cs_threshold) + 1L, p)
    if (cs_size > 1) {
      cs_indices <- alpha_order[1:cs_size]
      R_cs <- abs(Xcorr[cs_indices, cs_indices])
      # Purity = smallest absolute pairwise correlation within the CS.
      effect_purity[l] <- min(R_cs[upper.tri(R_cs)])
    }
  }

  # Collision: sentinels of two active slots in strong LD -> bump ever_diffuse
  current_collision <- rep(FALSE, L)
  for (l in which(is_active)) {
    others <- setdiff(which(is_active), l)
    if (length(others) == 0) next
    if (any(abs(Xcorr[sentinels[l], sentinels[others]]) > collision_threshold)) {
      current_collision[l] <- TRUE
      model$ever_diffuse[l] <- model$ever_diffuse[l] + 1L
    }
  }

  b_confident <- rep(0, p)
  alpha_protected <- matrix(0, nrow = L, ncol = p)
  force_unmask <- rep(FALSE, p)
  force_mask <- rep(FALSE, p)

  # Second pass: classify slots
  current_case <- rep(0L, L)
  for (l in 1:L) {
    purity <- effect_purity[l]
    sentinel <- sentinels[l]

    # Sentinel-jump reset: if sentinel moved to a non-tight-LD position, reset
    # the CASE 2 stability counter so WTE doesn't fire on a newly-picked signal.
    if (sentinel != model$prev_sentinel[l] && model$prev_sentinel[l] > 0L) {
      if (abs(Xcorr[sentinel, model$prev_sentinel[l]]) < tight_ld_threshold) {
        model$diffuse_iter_count[l] <- 0L
      }
    }

    can_be_confident <- (purity >= purity_threshold) && (model$ever_diffuse[l] == 0L)

    if (purity < diffuse_purity) {
      # CASE 1: diffuse. Narrow protection + force_mask on sentinel LD.
      current_case[l] <- 1L
      model$diffuse_iter_count[l] <- 0L
      moderate_ld <- abs(Xcorr[sentinel, ]) > ld_threshold
      to_protect <- moderate_ld | (model$alpha[l, ] > 5 / p)
      alpha_protected[l, to_protect] <- model$alpha[l, to_protect]
      force_mask <- force_mask | moderate_ld
    } else if (!can_be_confident) {
      # CASE 2: uncertain. Collision -> reset counter only (no alpha protection).
      # Otherwise full alpha protection + wait-then-expose.
      current_case[l] <- 2L
      if (current_collision[l]) {
        model$diffuse_iter_count[l] <- 0L
      } else {
        model$diffuse_iter_count[l] <- model$diffuse_iter_count[l] + 1L
        alpha_protected[l, ] <- model$alpha[l, ]
        if (model$diffuse_iter_count[l] >= diffuse_iter_count) {
          # Wait-then-expose: open the tight-LD neighborhood of the sentinel
          # to Mr.ASH unless it has already used its second chance.
          tight_ld <- abs(Xcorr[sentinel, ]) > tight_ld_threshold
          expose <- tight_ld & !model$second_chance_used
          newly <- expose & (model$force_exposed_iter == 0L)
          model$force_exposed_iter[newly] <- model$ash_iter
          if (any(newly)) model$diffuse_iter_count[l] <- 0L
          alpha_protected[l, expose] <- 0
          force_unmask <- force_unmask | expose
        }
      }
    } else {
      # CASE 3: confident. Full protection + c_hat-weighted subtraction.
      current_case[l] <- 3L
      model$diffuse_iter_count[l] <- 0L
      alpha_protected[l, ] <- model$alpha[l, ]
      b_confident <- b_confident + c_hat[l] * model$alpha[l, ] * model$mu[l, ]
    }
  }

  # Oscillation: slot flipping between CASE 2 and CASE 3 is unstable -> mark
  # sticky-diffuse, and if it landed on CASE 3 this iter, reverse the
  # subtraction we just added (slot is not trustworthy yet).
  oscillated <- model$prev_case != 0L & current_case != 0L &
    ((model$prev_case == 2L & current_case == 3L) |
     (model$prev_case == 3L & current_case == 2L))
  unstable_case3 <- oscillated & (current_case == 3L)
  model$ever_diffuse[oscillated] <- model$ever_diffuse[oscillated] + 1L
  for (l in which(unstable_case3)) {
    b_confident <- b_confident - c_hat[l] * model$alpha[l, ] * model$mu[l, ]
  }
  model$prev_case <- current_case
  model$prev_sentinel <- sentinels

  # Mask: PIP-based union, with per-position persistence
  pip_protected <- susie_get_pip(alpha_protected)
  LD_adj <- abs(Xcorr) > ld_threshold
  neighborhood_pip <- as.vector(LD_adj %*% pip_protected)
  want_masked <- (neighborhood_pip > neighborhood_pip_threshold) |
    (pip_protected > pip_threshold) | force_mask

  # Delayed unmask: count iters a masked position is no longer wanted
  reset_idx <- want_masked | !model$masked
  model$unmask_candidate_iters[!reset_idx] <- model$unmask_candidate_iters[!reset_idx] + 1L
  model$unmask_candidate_iters[reset_idx] <- 0L
  ready_to_unmask <- model$masked &
    ((model$unmask_candidate_iters >= delayed_unmask_iter & !model$ever_unmasked) | force_unmask)
  model$ever_unmasked[ready_to_unmask] <- TRUE
  masked <- (model$masked | want_masked) & !ready_to_unmask & !model$ever_unmasked

  # Second chance: positions exposed long enough ago get re-masked once.
  should_restore <- (model$force_exposed_iter > 0L) &
    (model$ash_iter - model$force_exposed_iter >= second_chance_wait) &
    !model$second_chance_used
  if (any(should_restore)) {
    model$second_chance_used[should_restore] <- TRUE
    model$force_exposed_iter[should_restore] <- 0L
    model$ever_unmasked[should_restore] <- FALSE
    masked[should_restore] <- TRUE
  }
  model$masked <- masked
  mask <- masked

  # Mr.ASH fit. Set options(susie.skip_mrash = TRUE) to diagnose without mr.ash.
  .skip_mrash <- getOption("susie.skip_mrash", FALSE)
  model$theta[mask] <- 0
  if (.skip_mrash) {
    theta_new <- model$theta; theta_new[mask] <- 0
    ash_result <- list(
      beta = theta_new,
      sigma2 = if (!is.null(model$sigma2)) model$sigma2 else 1,
      pi = model$ash_pi,
      tau2 = if (!is.null(model$tau2)) model$tau2 else 0)
  } else {
    # Looser tolerance on the first iteration; tighter afterwards.
    convtol <- if (model$ash_iter < 2) 1e-3 else 1e-4
    if (is_individual) {
      ash_result <- compute_ash_from_individual_data(
        data$X, data$y, b_confident, model, params, convtol)
    } else {
      ash_result <- compute_ash_from_summary_stats(
        data, b_confident, model, params, convtol)
    }
    theta_new <- ash_result$beta
    theta_new[mask] <- 0
  }

  # Diagnostic: append a per-iteration snapshot to the history environment.
  .ash_debug <- TRUE
  if (.ash_debug) {
    model$ever_uncertain <- model$ever_diffuse > 0
    diag_df <- diagnose_bb_ash_iter(
      model, Xcorr, mask, b_confident, sentinels, current_collision,
      current_case == 3L, current_case == 3L, which(current_case == 2L),
      which(model$V > 0), c_hat,
      list(beta = theta_new, sigma2 = ash_result$sigma2, pi = ash_result$pi),
      p, high_chat = integer(0), low_chat = integer(0),
      collision_threshold = collision_threshold,
      purity_threshold = ld_threshold,
      masking_threshold = ld_threshold,
      nPIP_threshold = pip_threshold,
      c_hat_excess_threshold = NA,
      alpha_entropy_threshold = NA,
      slot_prior = params$slot_prior,
      mask_smoothness = effect_purity,
      mask_amount = c_hat,
      mask_concentration = current_case,
      mask_burnin = model$ever_diffuse,
      mask_spread_pip_at_sent = pip_protected[sentinels],
      mask_pip_prot_at_sent = pip_protected[sentinels])
    if (is.null(model$.diag_env)) model$.diag_env <- new.env(parent = emptyenv())
    if (is.null(model$.diag_env$history)) model$.diag_env$history <- list()
    model$.diag_env$history[[length(model$.diag_env$history) + 1]] <- diag_df
  }

  result <- list(
    sigma2 = ash_result$sigma2,
    tau2 = ash_result$tau2,
    theta = theta_new,
    ash_pi = ash_result$pi,
    ash_iter = model$ash_iter,
    prev_case = model$prev_case,
    prev_sentinel = model$prev_sentinel,
    ever_diffuse = model$ever_diffuse,
    diffuse_iter_count = model$diffuse_iter_count,
    masked = model$masked,
    ever_unmasked = model$ever_unmasked,
    unmask_candidate_iters = model$unmask_candidate_iters,
    force_exposed_iter = model$force_exposed_iter,
    second_chance_used = model$second_chance_used,
    .diag_env = model$.diag_env
  )
  if (is_individual) {
    result$X_theta <- as.vector(data$X %*% theta_new)
  } else {
    result$XtX_theta <- as.vector(compute_Rv(data, theta_new))
  }
  return(result)
}

# Archived: Original filter-based ash variance component update
#
# Performs the full ash update cycle with the Diffusion-Aware masking
# heuristic: get correlation matrix, compute masking (3-case classification,
# WaitThenExpose, collision detection, nPIP masking), fit mr.ash, mask theta.
# This is the original SuSiE-ASH implementation with 9+ tuning parameters
# and per-effect/per-variant tracking arrays.
#
# Kept for internal diagnostics/archiving via unmappable_effects="ash_filter_archived".
# The default "ash" path now uses update_ash_variance_components() (c_hat + 3 LD rules).
#
# @param data Data object (individual or SS)
# @param model Current SuSiE model
# @param params Parameters object
#
# @return List with sigma2, tau2, theta, fitted theta, and all tracking fields
#
# @keywords internal
update_ash_variance_components_filter_archived <- function(data, model, params) {
  is_individual <- inherits(data, "individual")

  # Step 1: Get correlation matrix (cached after first call)
  xcorr_result <- get_xcorr(data)
  Xcorr <- xcorr_result$Xcorr
  data <- xcorr_result$data

  # Step 2: Compute masking (shared 3-case classification)
  mask_result <- compute_ash_masking(Xcorr, model, params)
  b_confident <- mask_result$b_confident
  masked <- mask_result$masked
  model <- mask_result$model

  # Step 3: Fit Mr.ASH (dispatch to individual or SS backend)
  # Set options(susie.skip_mrash = TRUE) to diagnose without mr.ash.
  .skip_mrash <- getOption("susie.skip_mrash", FALSE)
  if (.skip_mrash) {
    p_v0 <- ncol(model$alpha)  # (unused; kept from V0)
    mrash_output <- list(
      beta = model$theta,
      sigma2 = if (!is.null(model$sigma2)) model$sigma2 else 1,
      pi = model$ash_pi,
      tau2 = if (!is.null(model$tau2)) model$tau2 else 0,
      sa2 = if (!is.null(model$ash_s0)) model$ash_s0 else 0)
    mrash_output$beta[masked] <- 0
  } else {
    # Looser tolerance on the first iteration; tighter afterwards.
    convtol <- if (model$ash_iter < 2) 1e-3 else 1e-4
    if (is_individual) {
      mrash_output <- compute_ash_from_individual_data(
        data$X, data$y, b_confident, model, params, convtol
      )
    } else {
      mrash_output <- compute_ash_from_summary_stats(
        data, b_confident, model, params, convtol
      )
    }
  }

  # Step 4: Zero out theta for masked variants
  theta_new <- mrash_output$beta
  theta_new[masked] <- 0

  # V0 diagnostic: capture data.frame and accumulate on model
  .ash_debug <- TRUE
  if (.ash_debug) {
    diag_df <- diagnose_ash_filter_archived_iter(
      model, Xcorr, masked, b_confident, mask_result$sentinels,
      mask_result$effect_purity, mask_result$current_case,
      mask_result$current_collision, mrash_output)
    if (is.null(model$.diag_env)) model$.diag_env <- new.env(parent = emptyenv())
    if (is.null(model$.diag_env$history)) model$.diag_env$history <- list()
    model$.diag_env$history[[length(model$.diag_env$history) + 1]] <- diag_df
  }

  # Step 5: Compute fitted theta (data-representation-specific)
  result <- list(
    sigma2 = mrash_output$sigma2,
    tau2 = mrash_output$tau2,
    theta = theta_new,
    ash_pi = mrash_output$pi,
    sa2 = mrash_output$sa2,
    ash_iter = model$ash_iter,
    diffuse_iter_count = model$diffuse_iter_count,
    prev_sentinel = model$prev_sentinel,
    masked = masked,
    unmask_candidate_iters = model$unmask_candidate_iters,
    ever_unmasked = model$ever_unmasked,
    force_exposed_iter = model$force_exposed_iter,
    second_chance_used = model$second_chance_used,
    ever_diffuse = model$ever_diffuse,
    prev_case = model$prev_case,
    .diag_env = model$.diag_env
  )
  if (is_individual) {
    result$X_theta <- as.vector(data$X %*% theta_new)
  } else {
    result$XtX_theta <- as.vector(compute_Rv(data, theta_new))
  }
  return(result)
}

# Remove ash-specific runtime fields from model
#
# Shared between cleanup_model.individual() and cleanup_model.ss().
#
# @param model Model object
#
# @return Model with ash runtime fields removed
#
# @keywords internal
cleanup_ash_fields <- function(model) {
  # Remove internal tracking fields from the new ash path.
  # Keep: tau2, theta, ash_pi (user-visible results)
  for (field in c("X_theta", "XtX_theta", "ash_iter", "ash_s0",
                  "ever_uncertain", "prev_sentinel")) {
    model[[field]] <- NULL
  }
  return(model)
}

# Archived-filter counterpart of cleanup_ash_fields(); strips the larger
# set of tracking arrays used by the filter-based masking path.
# @keywords internal
cleanup_ash_fields_filter_archived <- function(model) {
  # Remove internal tracking fields from the archived filter path.
  for (field in c("X_theta", "XtX_theta", "ash_iter", "ash_s0", "masked",
                  "diffuse_iter_count", "prev_sentinel", "unmask_candidate_iters",
                  "ever_unmasked", "force_exposed_iter", "ever_diffuse",
                  "second_chance_used", "prev_case")) {
    model[[field]] <- NULL
  }
  return(model)
}

# Get or compute correlation matrix for ash masking
#
# For SS data: derives from XtX via safe_cov2cor (cheap scaling).
# For individual data: computes cor(X) and caches it on the data object.
#
# @param data Data object
#
# @return List with Xcorr and (possibly updated) data object
#
# @keywords internal
get_xcorr <- function(data) {
  # Serve from the cache when a previous iteration already built it.
  cached <- data$Xcorr_cache
  if (!is.null(cached))
    return(list(Xcorr = cached, data = data))
  if (!is.null(data$XtX)) {
    # SS path: an XtX whose diagonal is all 0/1 is already a correlation
    # matrix; otherwise rescale it.
    d <- diag(data$XtX)
    R <- if (all(d %in% c(0, 1))) data$XtX else safe_cov2cor(data$XtX)
  } else if (!is.null(data$X)) {
    # Individual path: compute correlation from X.
    R <- safe_cor(data$X)
  } else {
    stop("Cannot compute correlation matrix: data has neither XtX nor X")
  }
  # Cache so future iterations skip the recomputation.
  data$Xcorr_cache <- R
  list(Xcorr = R, data = data)
}

# Compute ash masking: classify effects, determine protection/masking
#
# KEY INSIGHT: Protect SuSiE's sparse effects from Mr.ASH absorption,
# but let Mr.ASH absorb unmappable and unreliable signals.
#
# Two types of diffusion (both indicate unreliable effects):
# 1. WITHIN-EFFECT: Low purity - spread across variants not in tight LD
# 2.
# CROSS-EFFECT: Sentinel collision - multiple effects compete for
# same position (composite signal, not clean single causal)
#
# Classification into three cases:
# CASE 1 (diffuse): purity < 0.1 - protect neighborhood loosely
# CASE 2 (uncertain): low purity OR ever_diffuse - expose to Mr.ASH
# CASE 3 (confident): purity >= 0.5 AND never diffuse - subtract from residuals
#
# Cross-effect diffusion tracking:
# - Detect via sentinel collision (sentinels in tight LD across effects)
# - Mark effect as ever_diffuse (sticky, effect-level)
# - ever_diffuse effects get zero protection permanently
# - Real signals survive Mr.ASH competition; composites get absorbed
#
# Low purity (non-diffuse) effects:
# - Use wait-then-expose mechanism
# - After diffuse_iter_count stable iterations, expose sentinel neighborhood
# - If Mr.ASH absorbs it, the signal was synthetic
# - Second-chance mechanism: after wait period, restore masking to check
#
# @param Xcorr Correlation matrix (p x p)
# @param model Current SuSiE model (with alpha, mu, tracking fields)
# @param params Parameters object
#
# @return List with b_confident, masked, and updated model tracking fields
#
# @keywords internal
compute_ash_masking <- function(Xcorr, model, params) {
  # --- Protection thresholds ---
  # Each threshold falls back to a hard-coded default when not supplied
  # in params.
  neighborhood_pip_threshold <- if (!is.null(params$neighborhood_pip_threshold)) params$neighborhood_pip_threshold else 0.4
  direct_pip_threshold <- if (!is.null(params$direct_pip_threshold)) params$direct_pip_threshold else 0.1
  signal_separation_ld <- if (!is.null(params$signal_separation_ld)) params$signal_separation_ld else 0.5
  # --- Purity thresholds ---
  cs_threshold <- if (!is.null(params$working_cs_threshold)) params$working_cs_threshold else 0.9
  cs_formation_threshold <- if (!is.null(params$cs_formation_threshold)) params$cs_formation_threshold else 0.1
  purity_threshold <- if (!is.null(params$purity_threshold)) params$purity_threshold else 0.5
  # --- LD thresholds for collision and exposure ---
  collision_threshold <- if (!is.null(params$collision_threshold)) params$collision_threshold else 0.9
  tight_ld_threshold <- if (!is.null(params$tight_ld_threshold)) params$tight_ld_threshold else 0.95
  # --- Iteration counters for CASE 2 ---
  diffuse_iter_count <- if (!is.null(params$diffuse_iter_count)) params$diffuse_iter_count else 2
  track_sentinel <- if (!is.null(params$track_sentinel)) params$track_sentinel else TRUE
  # --- Second chance mechanism ---
  second_chance_wait <- if (!is.null(params$second_chance_wait)) params$second_chance_wait else 3
  # --- Unmasking stability ---
  delayed_unmask_iter <- 2
  L <- nrow(model$alpha)
  p <- ncol(model$alpha)
  model$ash_iter <- model$ash_iter + 1
  # =========================================================================
  # First pass: Compute sentinels and purity
  # =========================================================================
  # Sentinel = the single highest-alpha position for each effect.
  sentinels <- apply(model$alpha, 1, which.max)
  effect_purity <- rep(NA, L)
  for (l in 1:L) {
    # Build a working credible set at cs_threshold coverage, then take
    # its minimum absolute correlation as the purity of effect l.
    alpha_order <- order(model$alpha[l,], decreasing = TRUE)
    cumsum_alpha <- cumsum(model$alpha[l, alpha_order])
    cs_size <- sum(cumsum_alpha <= cs_threshold) + 1
    cs_indices <- alpha_order[1:min(cs_size, p)]
    effect_purity[l] <- get_purity(cs_indices, X = NULL, Xcorr = Xcorr, use_rfast = FALSE)[1]
  }
  # Detect current collision and update ever_diffuse.
  # Effects with an essentially flat alpha (range < 5e-5) are skipped;
  # their sentinel is arbitrary and not meaningful.
  current_collision <- rep(FALSE, L)
  for (l in 1:L) {
    if (max(model$alpha[l,]) - min(model$alpha[l,]) < 5e-5) next
    sentinel_l <- sentinels[l]
    for (other_l in (1:L)[-l]) {
      if (max(model$alpha[other_l,]) - min(model$alpha[other_l,]) < 5e-5) next
      if (abs(Xcorr[sentinel_l, sentinels[other_l]]) > collision_threshold) {
        current_collision[l] <- TRUE
      }
    }
    # ever_diffuse is a sticky counter: once incremented it never resets,
    # so a single collision permanently disqualifies CASE 3.
    model$ever_diffuse[l] <- model$ever_diffuse[l] + current_collision[l]
  }
  # Initialize per-iteration outputs
  b_confident <- rep(0, p)
  alpha_protected <- matrix(0, nrow = L, ncol = p)
  force_unmask <- rep(FALSE, p)
  force_mask <- rep(FALSE, p)
  # =========================================================================
  # Second pass: Classify effects and determine protection
  # =========================================================================
  current_case <- rep(0, L)
  for (l in 1:L) {
    purity <- effect_purity[l]
    sentinel <- sentinels[l]
    # If the sentinel jumped to a position NOT in tight LD with the old
    # sentinel, the effect is unstable: reset its wait counter.
    if (track_sentinel && sentinel != model$prev_sentinel[l] && model$prev_sentinel[l] > 0) {
      if (abs(Xcorr[sentinel, model$prev_sentinel[l]]) < tight_ld_threshold) {
        model$diffuse_iter_count[l] <- 0
      }
    }
    is_ever_diffuse <- model$ever_diffuse[l] > 0
    can_be_confident <- (purity >= purity_threshold) && !is_ever_diffuse
    if (purity < cs_formation_threshold) {
      # CASE 1: Diffuse within effect - protect the sentinel's LD
      # neighborhood plus any position carrying non-trivial alpha (> 5/p).
      current_case[l] <- 1
      model$diffuse_iter_count[l] <- 0
      moderate_ld_with_sentinel <- abs(Xcorr[sentinel,]) > signal_separation_ld
      meaningful_alpha <- model$alpha[l,] > 5/p
      to_protect <- moderate_ld_with_sentinel | meaningful_alpha
      alpha_protected[l, to_protect] <- model$alpha[l, to_protect]
      force_mask <- force_mask | moderate_ld_with_sentinel
    } else if (!can_be_confident) {
      # CASE 2: Uncertain - wait-then-expose
      current_case[l] <- 2
      if (current_collision[l]) {
        model$diffuse_iter_count[l] <- 0
      } else {
        model$diffuse_iter_count[l] <- model$diffuse_iter_count[l] + 1
        if (model$diffuse_iter_count[l] >= diffuse_iter_count) {
          # Waited long enough: expose the tight-LD neighborhood of the
          # sentinel to Mr.ASH (unless it already used its second chance).
          tight_ld_with_sentinel <- abs(Xcorr[sentinel,]) > tight_ld_threshold
          newly_exposed <- tight_ld_with_sentinel & !model$second_chance_used & (model$force_exposed_iter == 0)
          model$force_exposed_iter[newly_exposed] <- model$ash_iter
          if (any(newly_exposed)) {
            model$diffuse_iter_count[l] <- 0
          }
          alpha_protected[l,] <- model$alpha[l,]
          expose_positions <- tight_ld_with_sentinel & !model$second_chance_used
          alpha_protected[l, expose_positions] <- 0
          force_unmask <- force_unmask | expose_positions
        } else {
          alpha_protected[l,] <- model$alpha[l,]
        }
      }
    } else {
      # CASE 3: Confident - subtract this effect from the Mr.ASH residuals
      # and protect all its positions.
      current_case[l] <- 3
      model$diffuse_iter_count[l] <- 0
      b_confident <- b_confident + model$alpha[l,] * model$mu[l,]
      alpha_protected[l,] <- model$alpha[l,]
    }
    model$prev_sentinel[l] <- sentinel
  }
  # =========================================================================
  # Oscillation detection
  # =========================================================================
  # An effect flipping between CASE 2 and CASE 3 across iterations is
  # treated as diffuse; if it flipped INTO CASE 3 this iteration, undo
  # its contribution to b_confident made above.
  for (l in 1:L) {
    prev <- model$prev_case[l]
    curr <- current_case[l]
    if (curr == 0 || prev == 0) next
    if ((prev == 2 && curr == 3) || (prev == 3 && curr == 2)) {
      model$ever_diffuse[l] <- model$ever_diffuse[l] + 1
      if (curr == 3) {
        b_confident <- b_confident - model$alpha[l,] * model$mu[l,]
      }
    }
  }
  model$prev_case <- current_case
  # =========================================================================
  # Masking logic
  # =========================================================================
  # A position is wanted-masked when its own protected PIP is high, its
  # LD neighborhood carries enough protected PIP, or CASE 1 forced it.
  pip_protected <- susie_get_pip(alpha_protected)
  LD_adj <- abs(Xcorr) > signal_separation_ld
  neighborhood_pip <- as.vector(LD_adj %*% pip_protected)
  want_masked <- (neighborhood_pip > neighborhood_pip_threshold) | (pip_protected > direct_pip_threshold) | force_mask
  dont_want_mask <- !want_masked
  # Delayed unmasking: a masked position must be unwanted for
  # delayed_unmask_iter consecutive iterations before it is released.
  model$unmask_candidate_iters[model$masked & dont_want_mask] <- model$unmask_candidate_iters[model$masked & dont_want_mask] + 1
  model$unmask_candidate_iters[want_masked | !model$masked] <- 0
  ready_to_unmask <- (model$masked & (model$unmask_candidate_iters >= delayed_unmask_iter) & !model$ever_unmasked) | (model$masked & force_unmask)
  model$ever_unmasked[ready_to_unmask] <- TRUE
  masked <- (model$masked | want_masked) & !ready_to_unmask & !model$ever_unmasked
  # Second chance: positions exposed long enough ago get their masking
  # restored exactly once, to re-test whether the signal was real.
  waited_long_enough <- (model$force_exposed_iter > 0) & (model$ash_iter - model$force_exposed_iter) >= second_chance_wait
  should_restore <- waited_long_enough & !model$second_chance_used
  if (any(should_restore)) {
    model$second_chance_used[should_restore] <- TRUE
    model$force_exposed_iter[should_restore] <- 0
    model$ever_unmasked[should_restore] <- FALSE
    masked[should_restore] <- TRUE
  }
  list(
    b_confident = b_confident,
    masked = masked,
    model = model,
    sentinels = sentinels,
    effect_purity = effect_purity,
    current_case = current_case,
    current_collision = current_collision
  )
}

# Run Mr.ASH on individual-level data
#
# Computes residuals from raw X, y and calls mr.ash directly.
#
# @param X Design matrix (n x p)
# @param y Response vector (n)
# @param b_confident Vector of confident effects to subtract from residuals
# @param model Current SuSiE model
# @param params Parameters object
# @param convtol Convergence tolerance for mr.ash
#
# @return List with beta, sigma2, pi, sa2, tau2
#
# @keywords internal
compute_ash_from_individual_data <- function(X, y, b_confident, model, params, convtol = 1e-4) {
  # Remove the confident SuSiE effects, then fit Mr.ASH to what remains.
  residuals <- y - X %*% b_confident
  mrash_output <- mr.ash(
    X = X,
    y = residuals,
    intercept = FALSE,
    standardize = FALSE,
    sigma2 = model$sigma2,
    update.sigma2 = params$estimate_residual_variance,
    beta.init = model$theta,
    pi = model$ash_pi,
    tol = list(convtol = convtol, epstol = 1e-12),
    verbose = params$verbose,
    max.iter = 1000
  )
  list(
    beta = mrash_output$beta,
    sigma2 = mrash_output$sigma2,
    pi = mrash_output$pi,
    sa2 = mrash_output$data$sa2,
    # tau2 = prior effect variance implied by the fitted mixture.
    tau2 = sum(mrash_output$data$sa2 * mrash_output$pi) * mrash_output$sigma2
  )
}

# Run Mr.ASH using summary statistics (via mr.ash.rss)
#
# Computes residual summary statistics from sufficient statistics and
# calls mr.ash.rss. This enables the "ash" unmappable effects mode
# for susie_ss() and susie_rss() without requiring raw X and y.
# # @param data Data object (must have $XtX, $Xty, $yty, $n) # @param b_confident Vector of confident effects to subtract from residuals # @param model Current SuSiE model # @param params Parameters object # @param convtol Convergence tolerance for mr.ash.rss # # @return List with beta, sigma2, pi, sa2, tau2 # # @keywords internal compute_ash_from_summary_stats <- function(data, b_confident, model, params, convtol = 1e-4) { # Compute residual sufficient statistics: r = y - X*b_confident # X'r = X'y - X'X * b_confident Xtr <- as.vector(data$Xty - data$XtX %*% b_confident) # r'r = y'y - 2*b'*X'y + b'*X'X*b rtr <- data$yty - 2 * sum(b_confident * data$Xty) + as.numeric(t(b_confident) %*% data$XtX %*% b_confident) XtXdiag <- diag(data$XtX) bhat <- Xtr / XtXdiag # Use n-2 df to match PVE adjustment in mr.ash.rss shat <- sqrt(pmax(0, (rtr - Xtr^2 / XtXdiag) / ((data$n - 2) * XtXdiag))) R_mat <- safe_cov2cor(data$XtX) var_r <- rtr / (data$n - 1) # Default prior grid (matching mr.ash defaults) if (is.null(model$ash_s0)) { sa2 <- (2^((0:24) / 25) - 1)^2 model$ash_s0 <- sa2 / median(XtXdiag) * data$n } K <- length(model$ash_s0) if (is.null(model$ash_pi)) model$ash_pi <- rep(1 / K, K) fit <- mr.ash.rss( bhat = bhat, shat = shat, R = R_mat, var_y = var_r, n = data$n, sigma2_e = model$sigma2, s0 = model$ash_s0, w0 = model$ash_pi, mu1_init = model$theta, tol = convtol, max_iter = 1000, update_w0 = TRUE, update_sigma = params$estimate_residual_variance ) list( beta = fit$beta, sigma2 = fit$sigma2, pi = fit$pi, sa2 = model$ash_s0, tau2 = sum(model$ash_s0 * fit$pi) * fit$sigma2 ) } # Run final Mr.ASH pass after SuSiE convergence # # After SuSiE converges, run one final Mr.ASH pass with ALL SuSiE effects # removed (unmasked) to get the final unmappable effects estimate. # Individual-level data uses mr.ash directly; SS data uses mr.ash.rss. 
#
# @param data Data object
# @param params Parameters object
# @param model Converged SuSiE model
#
# @return Model with updated theta, tau2, ash_pi, and fitted theta values
#
# @keywords internal
run_final_ash_pass <- function(data, params, model) {
  # Total SuSiE effect vector: every effect is removed for this pass.
  b_susie <- colSums(model$alpha * model$mu)
  is_individual <- inherits(data, "individual")
  # Dispatch to individual (mr.ash) or SS (mr.ash.rss) backend
  if (is_individual) {
    mrash_output <- compute_ash_from_individual_data(
      data$X, data$y, b_susie, model, params
    )
  } else {
    mrash_output <- compute_ash_from_summary_stats(data, b_susie, model, params)
  }
  # Update model (shared across both paths)
  model$theta <- mrash_output$beta
  model$tau2 <- mrash_output$tau2
  model$ash_pi <- mrash_output$pi
  # Compute fitted theta (data-representation-specific)
  if (is_individual) {
    model$X_theta <- as.vector(data$X %*% model$theta)
  } else {
    model$XtX_theta <- compute_Rv(data, model$theta)
  }
  return(model)
}

# Compute ELBO for infinitesimal effects model
#
# Works in the eigenbasis of the LD/covariance matrix: eigen_vectors and
# eigen_values define the rotation, VtXty is V'X'y. The per-effect loop
# accumulates the diagonal of V'MV where M is the posterior second-moment
# correction of b.
#' @keywords internal
compute_elbo_inf <- function(alpha, mu, omega, lbf, sigma2, tau2, n, p, eigen_vectors, eigen_values, VtXty, yty) {
  L <- nrow(mu)
  b <- colSums(mu * alpha)
  Vtb <- t(eigen_vectors) %*% b
  diagVtMV <- Vtb^2
  tmpD <- rep(0, p)
  for (l in seq_len(L)) {
    bl <- mu[l, ] * alpha[l, ]
    Vtbl <- t(eigen_vectors) %*% bl
    diagVtMV <- diagVtMV - Vtbl^2
    tmpD <- tmpD + alpha[l, ] * (mu[l, ]^2 + 1 / omega[l, ])
  }
  diagVtMV <- diagVtMV + rowSums(sweep(t(eigen_vectors)^2, 2, tmpD, `*`))
  # Compute variance of each rotated coordinate.
  var <- tau2 * eigen_values + sigma2
  # Compute negative ELBO, then negate.
  neg_elbo <- 0.5 * (n - p) * log(sigma2) + 0.5 / sigma2 * yty +
    sum(0.5 * log(var) - 0.5 * tau2 / sigma2 * VtXty^2 / var - Vtb * VtXty / var + 0.5 * eigen_values / var * diagVtMV)
  elbo <- -neg_elbo
  return(elbo)
}

# =============================================================================
# CREDIBLE SETS & POST-PROCESSING
#
# Functions for generating final output including credible sets, posterior
# inclusion probabilities, and summary statistics. These process the fitted
# model into interpretable results.
#
# Functions: n_in_CS_x, in_CS_x, n_in_CS, in_CS, get_purity
# =============================================================================

# Find how many variables in the CS.
# x is a probability vector.
#' @keywords internal
n_in_CS_x <- function(x, coverage = 0.9) {
  # Smallest k such that the k largest probabilities sum to >= coverage.
  sum(cumsum(sort(x, decreasing = TRUE)) < coverage) + 1
}

# Return binary vector indicating if each point is in CS.
# x is a probability vector.
#' @keywords internal
in_CS_x <- function(x, coverage = 0.9) {
  n <- n_in_CS_x(x, coverage)
  o <- order(x, decreasing = TRUE)
  result <- rep(0, length(x))
  result[o[1:n]] <- 1
  return(result)
}

# Returns an l-by-p binary matrix indicating which variables are in
# susie credible sets.
#' @keywords internal
in_CS <- function(res, coverage = 0.9) {
  if (inherits(res, "susie")) {
    res <- res$alpha
  }
  return(t(apply(res, 1, function(x) in_CS_x(x, coverage))))
}

#' @keywords internal
n_in_CS <- function(res, coverage = 0.9) {
  if (inherits(res, "susie")) {
    res <- res$alpha
  }
  return(apply(res, 1, function(x) n_in_CS_x(x, coverage)))
}

# Subsample and compute min, mean and median absolute correlation
# among the variables at positions `pos`. When Xcorr is NULL the
# correlations are computed from (at most n sampled) columns of X.
#' @importFrom stats median
#' @keywords internal
get_purity <- function(pos, X, Xcorr, squared = FALSE, n = 100, use_rfast = NULL) {
  if (is.null(use_rfast)) {
    use_rfast <- requireNamespace("Rfast", quietly = TRUE)
  }
  if (use_rfast) {
    get_upper_tri <- Rfast::upper_tri
    get_median <- Rfast::med
  } else {
    get_upper_tri <- function(R) R[upper.tri(R)]
    get_median <- median
  }
  # A singleton set is perfectly pure by definition.
  if (length(pos) == 1) {
    return(c(1, 1, 1))
  } else {
    if (is.null(Xcorr)) {
      if (length(pos) > n) {
        pos <- sample(pos, n)
      }
      X_sub <- X[, pos]
      X_sub <- as.matrix(X_sub)
      value <- abs(get_upper_tri(safe_cor(X_sub)))
    } else {
      value <- abs(get_upper_tri(Xcorr[pos, pos]))
    }
    if (squared) {
      value <- value^2
    }
    result <- c(
      min(value),
      sum(value) / length(value),
      get_median(value)
    )
    if (any(is.na(result) | is.nan(result))) {
      stop("get_purity returned NaN/NA. Check for constant columns or data issues.")
    }
    return(result)
  }
}

================================================
FILE: R/susie_workhorse.R
================================================
#' SuSiE workhorse function
#'
#' Main orchestration for the IBSS algorithm. When `params$L_greedy`
#' is non-NULL, runs a greedy outer loop that grows `L` in linear
#' steps of `params$L_greedy` until the fit has at least one empty
#' slot (`min(lbf) < params$greedy_lbf_cutoff`, default `0.1`) or `L` reaches
#' `params$L`. With `params$L_greedy = NULL` (default), runs a
#' single fixed-`L` IBSS, output bit-identical to prior susieR.
#'
#' @param data Data object (individual, ss, or rss_lambda).
#' @param params Validated params object.
#' @return Complete fitted SuSiE model.
#'
#' @export
#' @keywords internal
susie_workhorse <- function(data, params) {
  # Greedy-L outer loop. Saturation detected when any one slot's
  # lbf falls below greedy_lbf_cutoff (slot-invariant, single-round verdict).
  # Warm-start across rounds via params$model_init.
  if (!is.null(params$L_greedy)) {
    L_max <- params$L
    L_step <- params$L_greedy
    greedy_lbf_cutoff <- if (is.null(params$greedy_lbf_cutoff)) 0.1 else params$greedy_lbf_cutoff
    verbose <- isTRUE(params$verbose)
    history <- list()
    current_L <- min(L_step, L_max)
    fit <- NULL
    round_n <- 0L
    repeat {
      round_n <- round_n + 1L
      params_round <- params
      params_round$L_greedy <- NULL # avoid recursion
      params_round$L <- current_L
      # Warm-start the next round from the previous round's fit.
      if (!is.null(fit)) params_round$model_init <- fit
      fit <- susie_workhorse(data, params_round)
      min_lbf <- min(fit$lbf, na.rm = TRUE)
      action <- if (current_L >= L_max) "L_max reached" else if (min_lbf < greedy_lbf_cutoff) "saturated" else "grow"
      history[[round_n]] <- list(L = current_L, min_lbf = min_lbf, action = action)
      if (action != "grow") break
      current_L <- min(current_L + L_step, L_max)
    }
    if (verbose) {
      # Report one row per greedy round: L tried, min(lbf), decision.
      message(sprintf("[L_greedy] %d round%s, greedy_lbf_cutoff=%.3f, final L=%d",
                      round_n, if (round_n == 1L) "" else "s", greedy_lbf_cutoff, current_L))
      message(sprintf("%-6s %-5s %-10s %s", "round", "L", "min(lbf)", "action"))
      for (i in seq_along(history)) {
        h <- history[[i]]
        message(sprintf("%-6d %-5d %-10.3f %s", i, h$L, h$min_lbf, h$action))
      }
    }
    return(fit)
  }
  # Initialize model object
  model <- ibss_initialize(data, params)
  # Initialize ELBO & tracking; elbo[1] = -Inf so the first iteration
  # always registers an improvement.
  elbo <- rep(as.numeric(NA), params$max_iter + 1)
  elbo[1] <- -Inf
  tracking <- list()
  # Initialize runtime state (convergence tracking, cleaned up at finalization)
  model$runtime <- list(
    prev_elbo = -Inf,
    prev_alpha = model$alpha
  )
  # Main IBSS iteration loop
  for (iter in seq_len(params$max_iter)) {
    # Store iteration snapshot for track_fit
    tracking <- track_ibss_fit(data, params, model, tracking, iter, elbo)
    # Update all L effects
    model <- ibss_fit(data, params, model)
    # Calculate objective and check convergence
    elbo[iter + 1] <- get_objective(data, params, model)
    model <- check_convergence(data, params, model, elbo, iter)
    # Update convergence state for next iteration
    model$runtime$prev_elbo <- elbo[iter + 1]
    model$runtime$prev_alpha <- model$alpha
    if (model$converged) {
      break
    }
    # Update variance components if not converged.
    # The method itself checks params to decide what to update,
    # allowing S3 overrides to update additional model parameters
    model <- update_model_variance(data, params, model)
  }
  # Check final convergence status
  if (!model$converged) {
    warning_message(paste("IBSS algorithm did not converge in", params$max_iter, "iterations!"))
  }
  # Set ELBO from iterations (drop the -Inf sentinel at position 1)
  model$elbo <- elbo[2:(iter + 1)]
  # For NIG prior, scale prior variance by residual variance mode.
  if (isTRUE(params$use_NIG)) model$V <- model$V * model$rv
  # Zero out effects with negligible prior variance
  model <- trim_null_effects(data, params, model)
  model <- ibss_finalize(data, params, model, elbo, iter, tracking)
  # Run refinement if requested
  if (params$refine && !is.null(model$sets) && length(model$sets$cs) > 0) {
    model <- run_refine(model, data, params)
  }
  return(model)
}

================================================
FILE: R/univariate_regression.R
================================================
#' @title Perform Univariate Linear Regression Separately for Columns of X
#'
#' @description This function performs the univariate linear
#' regression y ~ x separately for each column x of X. The estimated effect size
#' and standard error for each variable are returned.
#'
#' @param X n by p matrix of regressors.
#'
#' @param y n-vector of response variables.
#'
#' @param Z Optional n by k matrix of covariates to be included in all
#' regressions. If Z is not \code{NULL}, the linear effects of
#' covariates are removed from y first, and the resulting residuals
#' are used in place of y.
#'
#' @param center If \code{center = TRUE}, center X, y and Z.
#'
#' @param scale If \code{scale = TRUE}, scale X, y and Z.
#'
#' @param return_residuals Whether or not to output the residuals if Z
#' is not \code{NULL}.
#'
#' @param method Either \dQuote{lmfit} (the default, uses
#' \code{\link[stats]{.lm.fit}}) or \dQuote{sumstats} (faster
#' implementation based on summary statistics).
#'
#' @return A list with two vectors containing the least-squares
#' estimates of the coefficients (\code{betahat}) and their standard
#' errors (\code{sebetahat}). Optionally, and only when a matrix of
#' covariates \code{Z} is provided, a third vector \code{residuals}
#' containing the residuals is returned.
#'
#' @examples
#' set.seed(1)
#' n = 1000
#' p = 1000
#' beta = rep(0,p)
#' beta[1:4] = 1
#' X = matrix(rnorm(n*p),nrow = n,ncol = p)
#' X = scale(X,center = TRUE,scale = TRUE)
#' y = drop(X %*% beta + rnorm(n))
#' res = univariate_regression(X,y)
#' plot(res$betahat/res$sebetahat)
#'
#' @importFrom stats lm
#' @importFrom stats .lm.fit
#' @importFrom stats coef
#' @importFrom stats summary.lm
#'
#' @export
#'
univariate_regression = function (X, y, Z = NULL, center = TRUE,
                                  scale = FALSE, return_residuals = FALSE,
                                  method = c("lmfit", "sumstats")) {
  method <- match.arg(method)
  # Drop observations with missing response.
  y_na <- which(is.na(y))
  if (length(y_na)) {
    X = X[-y_na,]
    y = y[-y_na]
  }
  if (center) {
    y = y - mean(y)
    X = scale(X,center = TRUE,scale = scale)
  } else
    X = scale(X,center = FALSE,scale = scale)
  # Scaling a constant column yields NaN; treat those columns as zero.
  X[is.nan(X)] = 0
  if (!is.null(Z)) {
    if (center)
      Z = scale(Z,center = TRUE,scale = scale)
    # Remove the linear effects of the covariates from y.
    y = .lm.fit(Z,y)$residuals
  }
  # fast implementation: computes X'X and X'y without forming X
  if (method == "sumstats") {
    output <- try({
      n <- length(y)
      sy <- sum(y)
      yy <- sum(y * y)
      p <- ncol(X)
      res <- matrix(NA_real_, nrow = p, ncol = 2)
      for (i in seq_len(p)) {
        x <- X[, i]
        sx <- sum(x)
        sxx <- sum(x * x)
        sxy <- sum(x * y)
        # XtX and Xty for the design [1, x]:
        # XtX = [[ n, sx ],
        #        [ sx, sxx]]
        detXtX <- n * sxx - sx * sx
        if (!is.finite(detXtX) || detXtX <= 0) {
          warning_message("Column ", i, " has zero variance after centering/scaling")
          res[i, ] <- c(0, 0) # constant/degenerate column
          next
        }
        XtX <- matrix(c(n, sx, sx, sxx), nrow = 2, ncol = 2)
        Xty <- c(sy, sxy)
        # Solve (XtX) beta = Xty via Cholesky: XtX = R^T R.
        R <- chol(XtX)
        beta <- backsolve(R, forwardsolve(t(R), Xty)) # slope is beta[2]
        # RSS = y'y - 2 beta^T X'y + beta^T XtX beta (no need to form
        # residuals)
        rss <- yy - 2 * sum(beta * Xty) + as.numeric(crossprod(beta, XtX %*% beta))
        sigma2 <- rss / (n - 2) # p = 2 (intercept + slope)
        # Var(beta) = sigma2 * (XtX)^{-1}; se(slope) = sqrt( ... [2,2] )
        XtX_inv <- chol2inv(R)
        se_slope <- sqrt(sigma2 * XtX_inv[2, 2])
        res[i, ] <- c(beta[2], se_slope)
      }
      res
    }, silent = TRUE)
  } else {
    # original .lm.fit-based implementation
    output = try(do.call(rbind, lapply(1:ncol(X), function (i) {
      g = .lm.fit(cbind(1,X[,i]),y)
      return(c(coef(g)[2],calc_stderr(cbind(1,X[,i]), g$residuals)[2]))
    })), silent = TRUE)
  }
  # Exception occurs, fall back to a safer but slower calculation.
  if (inherits(output,"try-error")) {
    output = matrix(0,ncol(X),2)
    for (i in 1:ncol(X)) {
      fit = summary(lm(y ~ X[,i]))$coef
      if (nrow(fit) == 2)
        # Reuse the coefficient table computed above rather than
        # refitting the same model a second time.
        output[i,] = as.vector(fit[2,1:2])
      else {
        warning_message("Column ", i, " has zero variance after centering/scaling")
        output[i,] = c(0,0)
      }
    }
  }
  if (return_residuals && !is.null(Z))
    return(list(betahat = output[,1],sebetahat = output[,2],residuals = y))
  else
    return(list(betahat = output[,1],sebetahat = output[,2]))
}

#' @rdname univariate_regression
#' @export
calc_z = function (X, Y, center = FALSE, scale = FALSE) {
  # Helper: z-score = betahat / sebetahat for a single response vector.
  univariate_z = function(X,Y,center,scale) {
    out = univariate_regression(X,Y,center = center,scale = scale)
    return(out$betahat/out$sebetahat)
  }
  if (is.null(dim(Y)))
    return(univariate_z(X,Y,center,scale))
  else
    # Multi-response: one column of z-scores per column of Y.
    return(do.call(cbind,lapply(1:ncol(Y), function(i) univariate_z(X,Y[,i],
                                                                    center = center,
                                                                    scale = scale))))
}

#' @title Per-Position Marginal OLS Regression of `Y` on Each Column of `X`
#'
#' @description Computes the marginal OLS regression coefficient and
#' standard error for each `(X column, Y column)` pair, treating
#' the regressions as independent. `X` is assumed column-centred
#' (no intercept term in the per-pair regression); each `Y`
#' column is treated independently. Returns the J x T matrices
#' `Bhat` and `Shat`.
#'
#' Used internally by single-effect-regression style routines that
#' need a per-position marginal estimate. Vectorised across columns
#' of `Y` so callers can pass either a numeric vector (T = 1) or a
#' numeric matrix (T > 1) without looping at the call site.
#'
#' @param X numeric matrix `n x J`, expected column-centred.
#' @param Y numeric matrix `n x T` or numeric vector of length `n`.
#' When a vector, is treated as a one-column matrix.
#' @param predictor_weights optional numeric vector of length `J`
#' giving `colSums(X^2)`. Computed internally when `NULL`.
#' Callers that have this cached on the data object pass it
#' through to avoid recomputation.
#' @param sigma2 optional numeric scalar giving a known residual
#' variance. When supplied, `Shat[j, t] = sqrt(sigma2 /
#' predictor_weights[j])` (single-effect-residual form). When
#' `NULL`, `Shat` is the per-pair empirical residual standard
#' error: for each `(j, t)` pair, the sample SD of `Y[, t] -
#' X[, j] * Bhat[j, t]` divided by `sqrt(n - 1)`. The latter
#' matches the form used by data-driven prior init routines
#' (e.g., for fitting a normal-mixture prior via `ashr::ash`).
#'
#' @return list with elements `Bhat` (`J x T`) and `Shat` (`J x T`).
#' #' @examples #' set.seed(1) #' X <- matrix(rnorm(50 * 5), 50, 5) #' X <- scale(X, center = TRUE, scale = FALSE) #' Y <- matrix(rnorm(50 * 3), 50, 3) #' out <- compute_marginal_bhat_shat(X, Y) #' dim(out$Bhat) # 5 x 3 #' dim(out$Shat) # 5 x 3 #' #' @importFrom Rfast colVars #' @export compute_marginal_bhat_shat <- function(X, Y, predictor_weights = NULL, sigma2 = NULL) { if (is.null(dim(Y))) { Y <- matrix(Y, ncol = 1) } n <- nrow(Y) J <- ncol(X) T_y <- ncol(Y) if (is.null(predictor_weights)) { predictor_weights <- colSums(X^2) } Bhat <- crossprod(X, Y) / predictor_weights # J x T if (!is.null(sigma2)) { Shat <- matrix(sqrt(sigma2 / predictor_weights), nrow = J, ncol = T_y) } else { Shat <- vapply( seq_len(T_y), function(t) Rfast::colVars(Y[, t] - sweep(X, 2, Bhat[, t], "*")), numeric(J) ) if (!is.matrix(Shat)) Shat <- matrix(Shat, nrow = J, ncol = T_y) Shat <- sqrt(pmax(Shat, 1e-64)) / sqrt(n - 1) } list(Bhat = Bhat, Shat = Shat) } # ---------------------------------------------------------------------- # Some miscellaneuous auxiliary functions are listed below. # Some functions are directly copied from varbvs, # https://github.com/pcarbo/varbvs # ---------------------------------------------------------------------- # Remove covariate effects Regresses Z out from X and y; that is, X # and y are projected into the space orthogonal to Z. 
#'
#' @importFrom Matrix forceSymmetric
#'
remove_covariate <- function (X, y, Z, standardize = FALSE, intercept = TRUE) {
  # check if Z is null and intercept = FALSE: nothing to remove.
  if (is.null(Z) & (intercept == FALSE)) {
    return(list(X = X, y = y, Z = Z, ZtZiZX = rep(0,dim(X)[2]), ZtZiZy = 0))
  }
  # redefine y as a plain double vector
  y = c(as.double(y))
  n = length(y)
  # add intercept if intercept = TRUE
  if (intercept) {
    if (is.null(Z))
      Z <- matrix(1,n,1)
    else
      Z <- cbind(1,Z)
  }
  if (ncol(Z) == 1) {
    # Intercept-only case: projection reduces to centering.
    ZtZ = forceSymmetric(crossprod(Z))            # (Z^T Z) symmetric
    ZtZiZy = as.vector(solve(ZtZ,c(y %*% Z)))     # (Z^T Z)^{-1} Z^T y
    ZtZiZX = as.matrix(solve(ZtZ,t(Z) %*% X))     # (Z^T Z)^{-1} Z^T X
    X = scale(X, center = intercept, scale = standardize)
    alpha = mean(y)
    y = y - alpha
  } else {
    ZtZ = forceSymmetric(crossprod(Z))            # (Z^T Z) symmetric
    ZtZiZy = as.vector(solve(ZtZ,c(y %*% Z)))     # (Z^T Z)^{-1} Z^T y
    ZtZiZX = as.matrix(solve(ZtZ,t(Z) %*% X))     # (Z^T Z)^{-1} Z^T X
    # y = y - Z (Z^T Z)^{-1} Z^T y
    # X = X - Z (Z^T Z)^{-1} Z^T X
    y = y - c(Z %*% ZtZiZy)
    X = X - Z %*% ZtZiZX
  }
  # The projection coefficients are returned so callers can apply the
  # same transform to new data.
  return(list(X = X, y = y, Z = Z, ZtZiZX = ZtZiZX, ZtZiZy = ZtZiZy))
}

#' @title Ordering of Predictors from Univariate Regression
#'
#' @description This function extracts the ordering of the predictors
#' according to the coefficients estimated in a basic univariate
#' regression; in particular, the predictors are ordered in decreasing
#' order by magnitude of the univariate regression coefficient
#' estimate.
#'
#' @param X An input design matrix. This may be centered and/or
#' standardized prior to calling function.
#'
#' @param y A vector of response variables.
#'
#' @return An ordering of the predictors.
#'
#' @examples
#' ### generate synthetic data
#' set.seed(1)
#' n = 200
#' p = 300
#' X = matrix(rnorm(n*p),n,p)
#' beta = double(p)
#' beta[1:10] = 1:10
#' y = X %*% beta + rnorm(n)
#'
#' univ.order = univar.order(X,y)
#'
#' @export
#'
univar.order = function(X, y) {
  # Marginal coefficient up to a common factor of n: X'y / colMeans(X^2);
  # the shared 1/n scaling does not change the ordering.
  colnorm = c(colMeans(X^2))
  return (order(abs(c(t(X) %*% y) / colnorm), decreasing = TRUE))
}

#' @title Ordering of Predictors from Coefficient Estimates
#'
#' @param beta A vector of estimated regression coefficients.
#'
#' @description This function orders the predictors by decreasing
#' order of the magnitude of the estimated regression coefficient.
#'
#' @return An ordering of the predictors.
#'
#' @examples
#' ### generate synthetic data
#' set.seed(1)
#' n = 200
#' p = 300
#' X = matrix(rnorm(n*p),n,p)
#' beta = double(p)
#' beta[1:10] = 1:10
#' y = X %*% beta + rnorm(n)
#'
#' ### order predictors by magnitude of univariate regression coefficient
#' beta.hat = univariate_regression(X,y)$betahat
#' order = absolute.order(beta.hat)
#'
#' @export
#'
absolute.order = function (beta) {
  abs_order = c(order(abs(beta), decreasing = TRUE))
  return (abs_order)
}

#' @title Ordering of Predictors by Regularization Path
#'
#' @param fit A fit object whose \code{coef()} method returns a matrix of
#' coefficients with the intercept in the first row and one column per
#' penalty strength (as produced by typical penalized-regression
#' implementations).
#'
#' @description This function determines an ordering of the predictors
#' based on the regularization path of the penalized regression; in
#' particular, the predictors are ordered based on the order in which
#' the coefficients are included in the model as the penalty strength
#' decreases.
#'
#' @return An ordering of the predictors.
#' #' @examples #' ### generate synthetic data #' set.seed(1) #' n = 200 #' p = 30 #' X = matrix(rnorm(n*p),n,p) #' beta = double(p) #' beta[1:10] = 1:10 #' y = X %*% beta + rnorm(n) #' #' ### build a minimal example 'fit' object with the same structure as a #' ### fit from a penalized regression: a coefficient matrix with the #' ### intercept in row 1 and one column per (decreasing) penalty value. #' beta_path = matrix(0, p + 1, p) #' for (k in 1:p) beta_path[k + 1, k:p] = 1 #' fit = list(coefficients = beta_path) #' order = path.order(fit) #' #' @export #' path.order = function (fit) { beta_path = coef(fit)[-1,] K = dim(beta_path)[2] path_order = c() for (k in 1:K) { crt_path = which(beta_path[,k] != 0) if (length(crt_path) != 0 & length(path_order) == 0) { path_order = c(path_order, crt_path) } else if(length(crt_path) != 0) { path_order = c(path_order, crt_path[-which(crt_path %in% path_order)] ) } } path_order = unname(path_order) index_order = c(path_order, seq(1,dim(beta_path)[1])[-path_order]) return (index_order) } ================================================ FILE: README.md ================================================ # susieR [![CI](https://github.com/stephenslab/susieR/actions/workflows/ci.yml/badge.svg)](https://github.com/stephenslab/susieR/actions/workflows/ci.yml) [![CRAN status badge](https://www.r-pkg.org/badges/version/susieR)](https://cran.r-project.org/package=susieR) [![Codecov test coverage](https://codecov.io/gh/StatFunGen/susieR/graph/badge.svg)](https://app.codecov.io/gh/stephenslab/susieR) The `susieR` package implements a simple new way to perform variable selection in multiple regression ($y=Xb+e$). The methods implemented here are particularly well-suited to settings where some of the X variables are highly correlated, and the true effects are highly sparse (e.g. <20 non-zero effects in the vector $b$). 
Genetic fine-mapping is one example of such an application, and it was a major motivation for developing these methods. However, the methods should also be useful more generally.

The methods are based on a new model for sparse multiple regression, which we call the "Sum of Single Effects" (SuSiE) model. This model, which is described in [Wang et al. (2020)](https://doi.org/10.1111/rssb.12388), lends itself to a particularly simple and intuitive fitting procedure -- effectively a Bayesian modification of simple forward selection, which we call "Iterative Bayesian Step-wise Selection".

The output of the fitting procedure is a number of "Credible Sets" (CSs), which are each designed to have high probability to contain a variable with non-zero effect, while at the same time being as small as possible. You can think of the CSs as being a set of "highly correlated" variables that are each associated with the response: you can be confident that one of the variables has a non-zero coefficient, but they are too correlated to be sure which one.

The package was initially developed by Gao Wang, Peter Carbonetto, Yuxin Zou, Kaiqian Zhang, and Matthew Stephens from the [Stephens Lab](https://stephenslab.uchicago.edu) at the University of Chicago. It was later extended with new methods and implementations by Alexander McCreight from the [StatFunGen Lab](https://wanggroup.org/) at Columbia University.

Please [post issues](https://github.com/stephenslab/susieR/issues) to ask questions, get support, or provide feedback; please [send pull requests](https://github.com/stephenslab/susieR/pulls) if you would like to help fix bugs or improve the source code.
## Quick Start Install susieR from [CRAN](https://cran.r-project.org/package=susieR): ```R install.packages("susieR") ``` Alternatively, install the latest development version of `susieR` from GitHub: ```R # install.packages("remotes") remotes::install_github("stephenslab/susieR") ``` See [here](https://stephenslab.github.io/susieR/articles/mwe.html) for a brief illustration of `susieR`. For more documentation and examples please visit https://stephenslab.github.io/susieR ## Citing this work If you find the `susieR` package or any of the source code in this repository useful for your work, please cite both: > Wang, G., Sarkar, A., Carbonetto, P. & Stephens, M. (2020). A > simple new approach to variable selection in regression, with > application to genetic fine mapping. *Journal of the Royal > Statistical Society, Series B* **82**, 1273–1300. > https://doi.org/10.1111/rssb.12388 > McCreight, A., Cho, Y., Li, R., Nachun, D., Gan, H-Y., Carbonetto, P., Stephens, > M., Denault, W.R.P. & Wang, G. (2025). SuSiE 2.0: > improved methods and implementations for genetic fine-mapping and > phenotype prediction. Submitting to *Genome Biology*. If you use any of the summary data methods such as `susie_ss` or `susie_rss`, please also cite: > Zou, Y., Carbonetto, P., Wang, G. & Stephens, M. (2022). Fine-mapping > from summary data with the "Sum of Single Effects" model. *PLoS > Genetics* **18**, e1010299. https://doi.org/10.1371/journal.pgen.1010299 If you use the Servin-Stephens prior on residual variance estimates (`estimate_residual_method = "NIG"`), please also cite: > Denault, W.R.P., Carbonetto, P., Li, R., Alzheimer's Disease Functional > Genomics Consortium, Wang, G. & Stephens, M. (2025). Accounting for > uncertainty in residual variances improves calibration of the "Sum of > Single Effects" model for small sample sizes. *bioRxiv*, 2025-05. > Under review for *Nature Methods*. 
+ To format the R source files in the `R` folder,
desc: > Detailed tutorials for genetic fine-mapping using susieR with individual-level and summary statistics data. contents: - finemapping - finemapping_summary_statistics - susie_rss - susierss_diagnostic - small_sample - title: "Advanced Topics" desc: > Advanced features and specialized applications of the susieR package. contents: - sparse_susie_eval - susie_refine - l0_initialization - trend_filtering - susie_unmappable_effects - title: "Package Information" navbar: ~ contents: - announcements footer: structure: left: developed_by right: built_with ================================================ FILE: inst/CITATION ================================================ citHeader("To cite the susieR package, please use both:") bibentry(bibtype = "Article", title = paste("A simple new approach to variable selection in", "regression, with application to genetic fine", "mapping"), author = c(person("Gao","Wang"), person("Abhishek","Sarkar"), person("Peter","Carbonetto"), person("Matthew","Stephens")), journal = "Journal of the Royal Statistical Society, Series B", year = "2020", volume = "82", pages = "1273-1300", doi = "10.1111/rssb.12388", textVersion = paste("Wang, G., Sarkar, A., Carbonetto, P. & Stephens, M. (2020).", "A simple new approach to variable selection in regression,", "with application to genetic fine mapping. Journal of the", "Royal Statistical Society, Series B 82, 1273-1300.", "https://doi.org/10.1111/rssb.12388")) bibentry(bibtype = "Article", title = paste("SuSiE 2.0: improved methods and implementations for", "genetic fine-mapping and phenotype prediction"), author = c(person("Alexander", "McCreight"), person("Yanghyeon", "Cho"), person("Daniel", "Nachun"), person("Ruixi", "Li"), person("Hao-Yu", "Gan"), person("Matthew", "Stephens"), person("Peter", "Carbonetto"), person("William", "R.P. 
Denault"), person("Gao", "Wang")), journal = "Submitting to Genome Biology", year = "2025", textVersion = paste("McCreight, A., Cho, Y., Nachun, D., Li, R., Gan, H-Y., Stephens,", "M., Carbonetto, P., Denault, W.R.P. & Wang, G. (2025). SuSiE 2.0:", "improved methods and implementations for genetic fine-mapping and", "phenotype prediction. Submitting to Genome Biology.")) bibentry(header = "If susie_suff_stat or susie_rss is used, please also cite:", bibtype = "Article", title = paste('Fine-mapping from summary data with the', '"Sum of Single Effects" model'), author = c(person("Yuxin","Zou"), person("Peter","Carbonetto"), person("Gao","Wang"), person("Matthew","Stephens")), journal = "PLoS Genetics", volume = "18", year = "2022", pages = "e1010299", doi = "10.1371/journal.pgen.1010299", textVersion = paste('Zou, Y., Carbonetto, P., Wang, G. & Stephens, M. (2022).', 'Fine-mapping from summary data with the "Sum of Single', 'Effects" model. PLoS Genetics 18, e1010299.', 'https://doi.org/10.1371/journal.pgen.1010299')) bibentry(header = paste("If estimate_residual_method = 'NIG' is used,", "please also cite:"), bibtype = "Article", title = paste("Accounting for uncertainty in residual variances", "improves calibration of the 'Sum of Single Effects'", "model for small sample sizes"), author = c(person("William", "R.P. Denault"), person("Peter", "Carbonetto"), person("Ruixi", "Li"), person("Alzheimer's Disease Functional Genomics Consortium"), person("Gao", "Wang"), person("Matthew", "Stephens")), journal = "bioRxiv", year = "2025", note = "Under review for Nature Methods", textVersion = paste("Denault, W.R.P., Carbonetto, P., Li, R., Alzheimer's Disease", "Functional Genomics Consortium, Wang, G. & Stephens, M. (2025).", "Accounting for uncertainty in residual variances improves", "calibration of the 'Sum of Single Effects' model for small", "sample sizes. bioRxiv, 2025-05. 
Under review for Nature Methods.")) bibentry(header = paste("If unmappable_effects = 'inf' is used,", "please also cite:"), bibtype = "Article", title = "Improving fine-mapping by modeling infinitesimal effects", author = c(person("Rui", "Cui"), person("R.A.", "Elzur"), person("M.", "Kanai"), person(c("et", "al."))), journal = "Nature Genetics", volume = "56", year = "2024", pages = "162-169", doi = "10.1038/s41588-023-01597-3", textVersion = paste("Cui, R., Elzur, R.A., Kanai, M. et al. (2024).", "Improving fine-mapping by modeling infinitesimal effects.", "Nature Genetics 56, 162-169.", "https://doi.org/10.1038/s41588-023-01597-3")) ================================================ FILE: inst/analysis/optimize.Rmd ================================================ --- title: "optimize" author: "Matthew Stephens" date: "4/15/2018" output: html_document --- ```{r setup, include=FALSE} knitr::opts_chunk$set(echo = TRUE) ``` Diagnose optimization issues with Lei's example ```{r} set.seed(777) devtools::load_all(".") X <- matrix(rnorm(1010 * 1000), 1010, 1000) beta <- rep(0, 1000) beta[1 : 200] <- 100 y <- X %*% beta + rnorm(1010) s = susie(X,y,L=1,estimate_residual_variance = TRUE) Y = y-s$Xr s2 = s$sigma2 x = seq(1,100000,length=100) l = rep(0,100) lg = rep(0,100) for(i in 1:100){ l[i] = loglik(x[i],Y,X,s2) lg[i] = loglik.grad(x[i],Y,X,s2) } plot(x,l) plot(x,lg) # > which.max(l) # [1] 23 # > lg[23] # [1] -2.398905e-07 # > lg[22] # [1] 6.282734e-07 lx = log(x) l2=l lg2=lg for(i in 1:100){ l2[i] = negloglik.logscale(lx[i],Y,X,s2) lg2[i] = negloglik.grad.logscale(lx[i],Y,X,s2) } plot(lx,l2) plot(lx,lg2) y = seq(0,20,length=100) l3=l2 lg3=lg2 for(i in 1:100){ l3[i] = negloglik.logscale(y[i],Y,X,s2) lg3[i] = negloglik.grad.logscale(y[i],Y,X,s2) } plot(y,l3) plot(y,lg3) uniroot(negloglik.grad.logscale,c(-20,20),extendInt = "upX",Y=Y,X=X,s2=s2) ``` So, to summarize, problem seems to be that optim has issues with very flat initial gradient near 0. 
================================================ FILE: inst/analysis/test_susie_auto.Rmd ================================================ --- title: "Test susie auto" author: "Matthew Stephens" date: "5/2/2018" output: html_document --- ```{r setup, include=FALSE} knitr::opts_chunk$set(echo = TRUE) ``` The goal here is to test the function `susie_auto` which tries to make susie run well even in some tricky situations (eg where $L$ is big, which susie is not well suited to). This is an example Lei Sun showed us from the paper demonstrating that false positives occur early on the Lasso path. Here I change L to 20 instead of 200 to make it run fast to begin with. ```{r} set.seed(777) library(susieR) L <- 20 X <- matrix(rnorm(1010 * 1000), 1010, 1000) beta <- rep(0, 1000) beta[1 : L] <- 100 y <- X %*% beta + rnorm(1010) ``` ```{r} s <- susie_auto(X,y,verbose=TRUE) s$sa2 ``` Now try L=200 ```{r} set.seed(777) L <- 200 X <- matrix(rnorm(1010 * 1000), 1010, 1000) beta <- rep(0, 1000) beta[1 : L] <- 100 y <- X %*% beta + rnorm(1010) s2 <- susie_auto(X,y,verbose=TRUE) s2$sa2 ``` ================================================ FILE: inst/analysis/testing.Rmd ================================================ --- title: "test.Rmd" author: "Matthew Stephens" date: "4/14/2018" output: html_document --- ```{r setup, include=FALSE} knitr::opts_chunk$set(echo = TRUE) ``` # simulate data This is Lei's example ```{r} set.seed(777) library(susieR) X <- matrix(rnorm(1010 * 1000), 1010, 1000) beta <- rep(0, 1000) beta[1 : 200] <- 100 y <- X %*% beta + rnorm(1010) s = susie(X,y,L=200) plot(coef(s),beta) s$sigma2 # fit <- lm(y ~ X - 1) # mlr.p <- log(summary(fit)$coefficients[, 4]) # mar.p <- c() mar.betahat = c() for (i in 1 : 1000) { fit <- lm(y ~ X[, i] - 1) mar.p[i] <- log(summary(fit)$coefficients[, 4]) mar.betahat[i] <- summary(fit)$coefficients[, 1] } # # pdf("pvalue.pdf", width = 10, height = 5) # par(mfrow = c(1, 2)) # plot(mlr.p, ylab = "log(p-value)", main = "Multiple Linear 
Regression") # abline(h = log(0.05 / 1000), lty = 2, col = "red") # legend("right", lty = 2, col = "red", "log(0.05/p)") # # plot(mar.p, ylab = "log(p-value)", main = "One-on-One Linear Regression") # abline(h = log(0.05 / 1000), lty = 2, col = "red") ``` Notice that the coefficients are monotonic with betahat. Some shrinkage of zero values is evident, but it is not enough... presumably because sigma2 is way over-estimated. And further we see excessive shrinkage of true signals, presumably because sa2 is too small. ```{r} plot(coef(s),mar.betahat) ``` Here we try fixing $L$ and residual variance to true value. ```{r} strue = susie(X,y,L=200,residual_variance =1,estimate_residual_variance =FALSE) plot(coef(strue),beta) strue$elbo ``` it works!! ```{r} plot(strue$alpha[1,]) plot(strue$alpha[2,]) ``` Try with very small residual variance ```{r} s3 = susie(X,y,L=200, residual_variance = 0.01,estimate_residual_variance = FALSE) plot(coef(s3)) s4 = susie(X,y,s_init = s3) plot(coef(s4)) s4$elbo ``` That is weird it goes away from the solution! Try with estimating prior: ```{r} s5 = susie(X,y,s_init = s3, estimate_prior_variance = TRUE) plot(coef(s5)) s5$elbo sqrt(s5$sa2) sqrt(s4$sa2) ``` much better! Now try too many effects ```{r} s3.300 = susie(X,y,L=300, residual_variance = 0.01,estimate_residual_variance = FALSE) s5.300 = susie(X,y,s_init = s3.300, estimate_prior_variance = TRUE) plot(coef(s3.300)) plot(coef(s5.300)) s3.300$elbo s5.300$elbo sum(s5.300$sa2>0) ``` Now try too many effects but just a very small number of iterations for initial case: ```{r} s3.300.5 = susie(X,y,L=300, residual_variance = 0.01,estimate_residual_variance = FALSE, max_iter = 5) s5.300.5 = susie(X,y,s_init = s3.300.5, estimate_prior_variance = TRUE) plot(coef(s3.300.5)) plot(coef(s5.300.5)) s3.300.5$elbo s5.300.5$elbo plot(colSums(s5.300.5$alpha)) ``` Q: does the initial run with small variance gradually find the smaller effects, or does it get them from the first iteration? 
Could look at that by doing one iteration at a time. ```{r} s3.300.1 = susie(X,y,L=300, residual_variance = 0.01,estimate_residual_variance = FALSE, max_iter = 1) plot(coef(s3.300.1)) s3.300.2 = susie(X,y,s_init=s3.300.1,estimate_residual_variance = FALSE, max_iter = 1) plot(coef(s3.300.2)) s3.300 = susie(X,y,s_init=s3.300.2,estimate_residual_variance = TRUE) ``` ================================================ FILE: inst/code/caviar.R ================================================ #!/usr/bin/env Rscript library(dplyr) library(readr) library(magrittr) #' CAVIAR I/O write_caviar_sumstats <- function(z, prefix) { cfg = list(z=paste0(prefix,".z"), set=paste0(prefix,"_set"), post=paste0(prefix,"_post"), log=paste0(prefix,".log")) write.table(z,cfg$z,quote=F,col.names=F) return(cfg) } #' Run CAVIAR #' https://github.com/fhormoz/caviar run_caviar <- function(z, LD_file, args = "", prefix="data") { cfg = write_caviar_sumstats(z, prefix) cmd = paste("CAVIAR", "-z", cfg$z, "-l", LD_file, "-o", prefix, args) dscrutils::run_cmd(cmd) if(!all(file.exists(cfg$post, cfg$set, cfg$log))) { stop("Cannot find one of the post, set, and log files") } log <- readLines(cfg$log) # read output tables snp <- read.delim(cfg$post) stopifnot(ncol(snp) == 3) names(snp) <- c("snp", "snp_prob_set", "snp_prob") snp$snp <- as.character(snp$snp) snp <- rank_snp(snp) # `set` of snps set <- readLines(cfg$set) set_ordered <- left_join(data_frame(snp = set), snp, by = "snp") %>% arrange(rank) %$% snp return(list(snp=snp, set=set_ordered)) } rank_snp <- function(snp) { snp <- arrange(snp, -snp_prob) %>% mutate( rank = seq(1, n()), snp_prob_cumsum = cumsum(snp_prob) / sum(snp_prob)) %>% select(rank, snp, snp_prob, snp_prob_cumsum, snp_prob_set) return(snp) } finemap_mcaviar <- function(zscore, LD_file, args, prefix) { if (is.null(dim(zscore))) { zscore = matrix(ncol=1,zscore) } return(parallel::mclapply(1:ncol(zscore), function(r) run_caviar(zscore[,r], LD_file, args, paste0(prefix, '_condition_', r)), 
mc.cores = min(8, ncol(zscore)))) } eval(parse(text=commandArgs(T))) dat = readRDS(input) sumstats = dat$sumstats ld = tempfile(fileext = ".ld") write.table(cor(dat$data$X),ld,quote=F,col.names=F,row.names=F) posterior = finemap_mcaviar(sumstats[1,,] / sumstats[2,,], ld, args, prefix=tempfile(fileext = ".caviar")) saveRDS(posterior, paste0(output, '.rds')) ================================================ FILE: inst/code/compute_ss_memory.R ================================================ # export MEM_CHECK_INTERVAL=0.01 # python3 monitor_memory.py Rscript compute_ss_memory.R # # NOTES: # # - Without any improvements: # Size of X: 0.3 GB # max rss_memory: 1.65 GB # # - The original centering and scaling steps require about 1 GB. # # - With the improvements: # Size of X: 0.3 GB # max rss_memory: 0.66 GB # # set.seed(1) # p <- 2000 # n <- 20000 # X <- matrix(rnorm(n*p),n,p) # y <- rnorm(n) # save(list = c("X","y"),file = "compute_ss_data.RData") # library(susieR) devtools::load_all() set.seed(1) load("compute_ss_data.RData") cat("Size of X:\n") print(object.size(X),unit = "GB") cat("Running compute_ss.\n") out <- compute_ss(X,y,standardize = TRUE) ================================================ FILE: inst/code/dap-g.py ================================================ #!/usr/bin/env python3 import sys import subprocess import pandas as pd import numpy as np def write_dap_full(x,y,prefix,r): names = np.array([('geno', i+1, f'group{r}') for i in range(x.shape[1])]) with open(f'{prefix}.data', 'w') as f: print(*(['pheno', 'pheno', f'group{r}'] + list(np.array(y).ravel())), file=f) np.savetxt(f, np.hstack((names, x.T)), fmt = '%s', delimiter = ' ') def run_dap_full(prefix, args): cmd = ['dap-g', '-d', f'{prefix}.data', '-o', f'{prefix}.result', '--output_all'] + ' '.join(args).split() subprocess.Popen(cmd, stdout=subprocess.PIPE, stderr=subprocess.PIPE).communicate() def write_dap_ss(z,prefix): '''z-score vesion of dap input is the same as FINEMAP''' ids = 
np.array([str(i+1) for i in range(z.shape[0])]) with open(f'{prefix}.z', 'w') as f: np.savetxt(f, np.vstack((ids, z)).T, fmt = '%s', delimiter = ' ') def run_dap_z(ld, prefix, args): cmd = ['dap-g', '-d_z', f'{prefix}.z', '-d_ld', ld, '-o', f'{prefix}.result', '--all'] + ' '.join(args).split() subprocess.Popen(cmd, stdout=subprocess.PIPE, stderr=subprocess.PIPE).communicate() def extract_dap_output(prefix): out = [x.strip().split() for x in open(f'{prefix}.result').readlines()] pips = [] clusters = [] still_pip = True for line in out: if len(line) == 0: continue if len(line) > 2 and line[2] == 'cluster_pip': still_pip = False continue if still_pip and (not line[0].startswith('((')): continue if still_pip: pips.append([line[1], float(line[2]), float(line[3]), int(line[4])]) else: clusters.append([len(clusters) + 1, float(line[2]), float(line[3])]) pips = pd.DataFrame(pips, columns = ['snp', 'snp_prob', 'snp_log10bf', 'cluster']) clusters = pd.DataFrame(clusters, columns = ['cluster', 'cluster_prob', 'cluster_avg_r2']) clusters = pd.merge(clusters, pips.groupby(['cluster'])['snp'].apply(','.join).reset_index(), on = 'cluster') return {'snp': pips, 'set': clusters} def dap_single(x, y, prefix, r, args): write_dap_full(x,y,prefix,r) run_dap_full(prefix,args) return extract_dap_output(prefix) def dap_single_z(z, ld, prefix, args): write_dap_ss(z,prefix) run_dap_z(ld,prefix,args) return extract_dap_output(prefix) def dap_batch(X, Y, prefix, *args): return dict([(f'V{r+1}', dap_single(X, Y[:,r], f'{prefix}_condition_{r+1}', r+1, args)) for r in range(Y.shape[1])]) def dap_batch_z(z, ld, prefix, *args): return dict([(f'V{r+1}', dap_single_z(z[:,r], ld, f'{prefix}_condition_{r+1}', args)) for r in range(z.shape[1])]) import os from dsc.dsc_io import load_rds, save_rds import tempfile import warnings if not sys.warnoptions: warnings.simplefilter("ignore") input_file = os.path.expanduser(sys.argv[1]) output_file = os.path.expanduser(sys.argv[2]) args = sys.argv[3:] data = 
load_rds(input_file)['data'] cache = tempfile.NamedTemporaryFile(suffix = '.dap') posterior = dap_batch(data['X'], data['Y'], cache.name, ' '.join(args)) save_rds(posterior, output_file + '.rds') ================================================ FILE: inst/code/finemap.R ================================================ #!/usr/bin/env Rscript library(dplyr) library(readr) library(magrittr) #' FINEMAP I/O write_finemap_sumstats <- function(z, LD_file, n, k, prefix) { cfg = list(z=paste0(prefix,".z"), ld=LD_file, snp=paste0(prefix,".snp"), config=paste0(prefix,".config"), k=paste0(prefix,".k"), log=paste0(prefix,".log"), meta=paste0(prefix,".master")) write.table(z,cfg$z,quote=F,col.names=F) if (!is.null(k)) { write.table(t(k),cfg$k,quote=F,col.names=F,row.names=F) write("z;ld;snp;config;k;log;n-ind",file=cfg$meta) write(paste(cfg$z, cfg$ld, cfg$snp, cfg$config, cfg$k, cfg$log, n, sep=";"), file=cfg$meta,append=TRUE) } else { write("z;ld;snp;config;log;n-ind",file=cfg$meta) write(paste(cfg$z, cfg$ld, cfg$snp, cfg$config, cfg$log, n, sep=";"), file=cfg$meta,append=TRUE) } return(cfg) } #' Run FINEMAP version 1.1 #' http://www.christianbenner.com ## FIXME: read the finemapr implementation for data sanity check. 
## Can be useful as a general data sanity checker (in previous modules)

# Run FINEMAP (v1.1) on one vector of z-scores and collect its outputs.
#
#   z:       numeric vector of per-SNP z-scores.
#   LD_file: path to the LD matrix file handed to FINEMAP.
#   n:       sample size recorded in the FINEMAP master file.
#   k:       optional prior on the number of causal SNPs (NULL to omit).
#   args:    extra command-line arguments appended to the finemap call.
#   prefix:  file-name prefix shared by all input/output files.
#
# Returns list(snp = ranked per-SNP results, set = configuration table,
# ncausal = table of prior/posterior on the number of causal SNPs).
#
# NOTE(review): requires the external "finemap" executable on PATH and
# the dscrutils package to run the shell command.
run_finemap <- function(z, LD_file, n, k, args = "", prefix="data") {
  # Write the .z and .master input files that FINEMAP reads; cfg holds
  # the paths of every input/output file.
  cfg = write_finemap_sumstats(z, LD_file, n, k, prefix)
  cmd = paste("finemap --sss --log", "--in-files", cfg$meta, args)
  dscrutils::run_cmd(cmd)
  # read output tables
  snp = read.table(cfg$snp,header=TRUE,sep=" ")
  snp$snp = as.character(snp$snp)
  snp = rank_snp(snp)
  config = read.table(cfg$config,header=TRUE,sep=" ")
  # Only keep configurations with cumulative 95% probability
  # config = within(config, config_prob_cumsum <- cumsum(config_prob))
  # config = config[config$config_prob_cumsum <= 0.95,]
  # extract number of causal
  ncausal = finemap_extract_ncausal(cfg$log)
  return(list(snp=snp, set=config, ncausal=ncausal))
}

# Sort SNPs by decreasing posterior probability, then add a 1-based rank
# and the normalized cumulative probability. Uses dplyr verbs (dplyr is
# loaded with library() at the top of this script).
rank_snp <- function(snp) {
  snp <- arrange(snp, -snp_prob) %>%
    mutate(
      rank = seq(1, n()),
      snp_prob_cumsum = cumsum(snp_prob) / sum(snp_prob)) %>%
    select(rank, snp, snp_prob, snp_prob_cumsum, snp_log10bf)
  return(snp)
}

# Parse the FINEMAP log for lines containing "->", which report the
# distribution over the number of causal SNPs. The first occurrence of
# a given count is labeled "prior"; a repeated count is labeled "post".
finemap_extract_ncausal <- function(logfile) {
  lines <- grep("->", readLines(logfile), value = TRUE)
  # Strip parentheses and ">" so the fields split cleanly on whitespace;
  # field 2 is the causal count, field 4 its probability.
  lines <- gsub("\\(|\\)|>", "", lines)
  splits <- strsplit(lines, "\\s+")
  tab <- data.frame(
    ncausal_num = sapply(splits, function(x) as.integer(x[2])),
    ncausal_prob = sapply(splits, function(x) as.double(x[4])))
  tab <- mutate(tab, type = ifelse(duplicated(ncausal_num), "post", "prior"))
  return(tab)
}

# Run FINEMAP once per column ("condition") of a z-score matrix,
# optionally in parallel via mclapply (capped at 8 cores).
finemap_mvar <- function(zscore, LD_file, n, k, args, prefix, parallel = FALSE) {
  # Promote a bare vector to a one-column matrix.
  if (is.null(dim(zscore))) {
    zscore = matrix(ncol=1,zscore)
  }
  single_core = function(r) run_finemap(zscore[,r], LD_file, n, k, args, paste0(prefix, '_condition_', r))
  if (parallel)
    return(parallel::mclapply(1:ncol(zscore), function(r) single_core(r),
      mc.cores = min(8, ncol(zscore))))
  else
    return(lapply(1:ncol(zscore), function(r) single_core(r)))
}

# Script entry point: the command line supplies R expressions that define
# `input`, `output` and `args` (evaluated here via eval/parse).
eval(parse(text=commandArgs(T)))
dat = readRDS(input)
sumstats = dat$sumstats
N = nrow(dat$data$X)
ld = tempfile(fileext = ".ld")
write.table(cor(dat$data$X),ld,quote=F,col.names=F,row.names=F) posterior = finemap_mvar(sumstats[1,,] / sumstats[2,,], ld, N, k=NULL, args, prefix=tempfile(fileext = ".finemap")) saveRDS(posterior, paste0(output, '.rds')) ================================================ FILE: inst/code/finemap_1p4.R ================================================ #!/usr/bin/env Rscript library(dplyr) library(readr) library(magrittr) #' FINEMAP I/O write_finemap_sumstats <- function(beta, se, LD_file, n, k, prefix) { cfg = list(z=paste0(prefix,".z"), ld=LD_file, snp=paste0(prefix,".snp"), config=paste0(prefix,".config"), cred=paste0(prefix, ".cred"), k=paste0(prefix,".k"), log=paste0(prefix,".log"), meta=paste0(prefix,".master")) se = replace(se, se == 0, 'nan') z = data.frame(chromosome="chr", position=seq(1, length(beta)), allele1='nan', allele2='nan', maf='nan', beta, se) z = cbind(rsid=z$position, z) write.table(z,cfg$z,quote=F,col.names=T,row.names=F) if (!is.null(k)) { write.table(t(k),cfg$k,quote=F,col.names=F,row.names=F) write("z;ld;snp;config;cred;n_samples;k;log",file=cfg$meta) write(paste(cfg$z, cfg$ld, cfg$snp, cfg$config, cfg$cred, n, cfg$k, cfg$log, sep=";"), file=cfg$meta,append=TRUE) } else { write("z;ld;snp;config;cred;n_samples;log",file=cfg$meta) write(paste(cfg$z, cfg$ld, cfg$snp, cfg$config, cfg$cred, n, cfg$log, sep=";"), file=cfg$meta,append=TRUE) } return(cfg) } #' Run FINEMAP version 1.4 #' http://www.christianbenner.com ## FIXME: read the finemapr implementation for data sanity check. 
## Can be useful as a general data sanity checker (in previous modules) run_finemap <- function(beta, se, LD_file, n, k, args = "", prefix="data") { cfg = write_finemap_sumstats(beta, se, LD_file, n, k, prefix) cmd = paste("finemap --sss --log", "--in-files", cfg$meta, args) dscrutils::run_cmd(cmd) cfg$log = paste0(cfg$log, "_sss") # read output tables snp = read.table(cfg$snp,header=TRUE,sep=" ") snp$snp = as.character(snp$rsid) snp = rank_snp(snp) # we add snp-prob for backwards-compatability with code that used this script with FINEMAP v1.1 snp$prob = snp$snp_prob config = read.table(cfg$config,header=TRUE,sep=" ") # Only keep configurations with cumulative 95% probability # config = within(config, config_prob_cumsum <- cumsum(config_prob)) # config = config[config$config_prob_cumsum <= 0.95,] # extract number of causal ncausal = finemap_extract_ncausal(cfg$log) return(list(snp=snp, set=config, ncausal=ncausal)) } rank_snp <- function(snp) { snp <- arrange(snp, -prob) %>% mutate( rank = seq(1, n()), prob_cumsum = cumsum(prob) / sum(prob)) %>% select(rank, snp, prob, prob_cumsum, log10bf) return(snp) } finemap_extract_ncausal <- function(logfile) { lines <- grep("->", readLines(logfile), value = TRUE) lines <- gsub("\\(|\\)|>", "", lines) splits <- strsplit(lines, "\\s+") tab <- data.frame( ncausal_num = sapply(splits, function(x) as.integer(x[2])), ncausal_prob = sapply(splits, function(x) as.double(x[4]))) tab <- mutate(tab, type = ifelse(duplicated(ncausal_num), "post", "prior")) return(tab) } finemap_mvar <- function(beta, se, LD_file, n, k, args, prefix, parallel = FALSE) { if (is.null(dim(beta))) { beta = matrix(ncol=1,beta) } if (is.null(dim(se))) { se = matrix(ncol=1,se) } single_core = function(r) run_finemap(beta[,r], se[,r], LD_file, n, k, args, prefix=paste0(prefix, '_condition_', r)) if (parallel) return(parallel::mclapply(1:ncol(beta), function(r) single_core(r), mc.cores = min(8, ncol(beta)))) else return(lapply(1:ncol(beta), function(r) 
single_core(r))) } eval(parse(text=commandArgs(T))) dat = readRDS(input) sumstats = dat$sumstats N = nrow(dat$data$X) ld = tempfile(fileext = ".ld") ld_mat = cor(dat$data$X) ld_mat[is.na(ld_mat)] = 'nan' write.table(ld_mat,ld,quote=F,col.names=F,row.names=F) posterior = finemap_mvar(sumstats[1,,], sumstats[2,,], ld, N, k=NULL, args, prefix=tempfile(fileext = ".finemap")) saveRDS(posterior, paste0(output, '.rds')) ================================================ FILE: inst/code/gen_original_results.R ================================================ ## results from original susie devtools::install_github("stephenslab/susieR") library(susieR) create_sparsity_mat = function(sparsity, n, p){ nonzero = round(n*p*(1-sparsity)) nonzero.idx = sample(n*p, nonzero) mat = numeric(n*p) mat[nonzero.idx] = 1 mat = matrix(mat, nrow=n, ncol=p) return(mat) } set.seed(1) n = 100 p = 200 beta = rep(0,p) beta[1] = 10 beta[2] = 10 beta[3] = 10 beta[4] = 10 X.dense = create_sparsity_mat(0.99,n,p) y = c(X.dense %*% beta + rnorm(n)) L = 10 residual_variance = 0.8 scaled_prior_variance = 0.2 s = list(alpha=matrix(1/p,nrow=L,ncol=p), mu=matrix(2,nrow=L,ncol=p), mu2=matrix(3,nrow=L,ncol=p), Xr=rep(5,n), KL=rep(1.2,L), sigma2=residual_variance, V=scaled_prior_variance * as.numeric(var(y))) X = susieR:::set_X_attributes(X.dense) Eb = rep(1, p) Eb2 = rep(1, p) s2 = residual_variance V = scaled_prior_variance objective.original.res = susieR::susie_get_objective(s) saveRDS(objective.original.res, 'objective_original_res.rds') Eloglik.original.res = susieR:::Eloglik(X,y,s) saveRDS(Eloglik.original.res, 'Eloglik_original_res.rds') ER2.original.res = susieR:::get_ER2(X,y,s) saveRDS(ER2.original.res, 'ER2_original_res.rds') SER.original.res = susieR:::SER_posterior_e_loglik(X,y,s2,Eb,Eb2) saveRDS(SER.original.res, 'SER_original_res.rds') singleReg.original.res = susieR:::single_effect_regression(y,X,V) saveRDS(singleReg.original.res, 'singleReg_original_res.rds') vbupdate.original.res = 
susieR:::update_each_effect(X, y, s) saveRDS(vbupdate.original.res, 'vbupdate_original_res.rds') susiefit.original.res = susie(X.dense,y) saveRDS(susiefit.original.res, 'susiefit_original_res.rds') susiefit.original.res2 = susie(X.dense, y, standardize = TRUE, intercept = FALSE) susiefit.original.res3 = susie(X.dense, y, standardize = FALSE, intercept = TRUE) susiefit.original.res4 = susie(X.dense, y, standardize = FALSE, intercept = FALSE) saveRDS(susiefit.original.res2, 'susiefit_original_res2.rds') saveRDS(susiefit.original.res3, 'susiefit_original_res3.rds') saveRDS(susiefit.original.res4, 'susiefit_original_res4.rds') ================================================ FILE: inst/code/monitor_memory.py ================================================ #!/usr/bin/env python3 # # Copyright (c) 2012 Realz Slaw, 2017 Gao Wang # # Permission is hereby granted, free of charge, to any person # obtaining a copy of this software and associated documentation files # (the "Software"), to deal in the Software without restriction, # including without limitation the rights to use, copy, modify, merge, # publish, distribute, sublicense, and/or sell copies of the Software, # and to permit persons to whom the Software is furnished to do so, # subject to the following conditions: # # The above copyright notice and this permission notice shall be # included in all copies or substantial portions of the Software. # # THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, # EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF # MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND # NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS # BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN # ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN # CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE # SOFTWARE. 
import time import psutil import subprocess class ProcessTimer: def __init__(self, command, interval = 1): self.command = command self.execution_state = False self.interval = interval def execute(self): self.max_vms_memory = 0 self.max_rss_memory = 0 self.t0 = time.time() self.t1 = None self.max_t = [self.t0] try: self.p = subprocess.Popen(self.command, shell=False) except FileNotFoundError: self.p = None sys.exit("Invalid command `{}`".format(sys.argv[1])) self.execution_state = True def poll(self): if not self.check_execution_state(): return False self.t1 = time.time() try: pp = psutil.Process(self.p.pid) # Obtain a list of the subprocess and all its descendants. descendants = list(pp.children(recursive=True)) descendants = descendants + [pp] rss_memory = 0 vms_memory = 0 # Calculate and sum up the memory of the subprocess and all its # descendants. for descendant in descendants: try: mem_info = descendant.memory_info() rss_memory += mem_info[0] vms_memory += mem_info[1] except (psutil.NoSuchProcess, psutil.ZombieProcess, psutil.AccessDenied): # Sometimes a subprocess descendant will have terminated # between the time we obtain a list of descendants, and the # time we actually poll this descendant's memory usage. pass if int(self.max_vms_memory * 1E-8) < int(vms_memory * 1E-8): # Peak memory updated, at ~100-MB resolution. self.max_t = [self.t1] if int(self.max_vms_memory * 1E-8) == int(vms_memory * 1E-8): # Peak memory maintained. 
self.max_t = [self.max_t[0], self.t1] self.max_vms_memory = max(self.max_vms_memory,vms_memory) self.max_rss_memory = max(self.max_rss_memory,rss_memory) except (psutil.NoSuchProcess, psutil.ZombieProcess, psutil.AccessDenied): return self.check_execution_state() return self.check_execution_state() def is_running(self): return psutil.pid_exists(self.p.pid) and self.p.poll() == None def check_execution_state(self): if not self.execution_state: return False if self.is_running(): return True self.executation_state = False self.t1 = time.time() return False def close(self,kill=False): if self.p is not None: try: pp = psutil.Process(self.p.pid) if kill: pp.kill() else: pp.terminate() except (psutil.NoSuchProcess, psutil.ZombieProcess, psutil.AccessDenied): pass def takewhile_excluding(iterable, value = ['|', '<', '>']): for it in iterable: if it in value: return yield it if __name__ == '__main__': import sys, os if len(sys.argv) <= 1: sys.exit() interval = float(os.environ['MEM_CHECK_INTERVAL']) if 'MEM_CHECK_INTERVAL' in os.environ else 1 ptimer = ProcessTimer(takewhile_excluding(sys.argv[1:]), interval) try: ptimer.execute() # Poll as often as possible; otherwise the subprocess might # "sneak" in some extra memory usage while you aren't looking. while ptimer.poll(): time.sleep(ptimer.interval) finally: # Make sure that we don't leave the process dangling. 
ptimer.close() sys.stderr.write('\ntime elapsed: {:.2f}s\n'.format(max(0, ptimer.t1 - ptimer.t0 - ptimer.interval * 0.5))) sys.stderr.write('peak first occurred: {:.2f}s\n'.format(min(ptimer.max_t) - ptimer.t0)) sys.stderr.write('peak last occurred: {:.2f}s\n'.format(max(ptimer.max_t) - ptimer.t0)) sys.stderr.write('max vms_memory: {:.2f}GB\n'.format(ptimer.max_vms_memory * 1.07E-9)) sys.stderr.write('max rss_memory: {:.2f}GB\n'.format(ptimer.max_rss_memory * 1.07E-9)) sys.stderr.write('memory check interval: %ss\n' % ptimer.interval) sys.stderr.write('return code: %s\n' % ptimer.p.returncode) ================================================ FILE: inst/code/python_example/N3finemapping_python.ipynb ================================================ { "cells": [ { "cell_type": "markdown", "id": "c7ac5176-713f-4752-b055-607a22a6dc3e", "metadata": {}, "source": [ "# N3 fine-mapping example (Python)" ] }, { "cell_type": "code", "execution_count": 1, "id": "571c6701-abff-4535-a25e-8c1bdf53d0a9", "metadata": {}, "outputs": [], "source": [ "import numpy as np\n", "import pandas as pd\n", "import rpy2.robjects as ro\n", "from rpy2.robjects.packages import importr, data\n", "from rpy2.robjects import numpy2ri\n", "susie = importr('susieR')" ] }, { "cell_type": "code", "execution_count": 2, "id": "4395eb9b-af70-413a-adc5-edce1f5160fa", "metadata": {}, "outputs": [], "source": [ "conversion_rules = numpy2ri.converter + ro.default_converter\n", "with (conversion_rules).context(): \n", " ro.r['set.seed'](1)\n", " N3 = data(susie).fetch('N3finemapping')['N3finemapping']\n", " N3_names = {v:i for i,v in enumerate(N3.names)}\n", " n = N3[N3_names['X']].dim[0]" ] }, { "cell_type": "code", "execution_count": 3, "id": "235c3ed5-4415-4301-956d-00615ff6bf48", "metadata": {}, "outputs": [ { "data": { "text/plain": [ "(array([402, 652, 772]),)" ] }, "execution_count": 3, "metadata": {}, "output_type": "execute_result" } ], "source": [ "b = N3[N3_names['true_coef']]\n", 
"np.where(np.array(b)[:,0] != 0)" ] }, { "cell_type": "code", "execution_count": 4, "id": "f50d1770-94aa-4128-8f50-659d9e366d6b", "metadata": {}, "outputs": [ { "name": "stderr", "output_type": "stream", "text": [ "R[write to console]: HINT: For estimate_residual_variance = TRUE, please check that R is the \"in-sample\" LD matrix; that is, the correlation matrix obtained using the exact same data matrix X that was used for the other summary statistics. Also note, when covariates are included in the univariate regressions that produced the summary statistics, also consider removing these effects from X before computing R.\n", "\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ " cs cs_log10bf cs_avg_r2 cs_min_r2\n", "1 2 4.033879 1.0000000 1.0000000\n", "2 1 6.744085 0.9634847 0.9634847\n", "3 3 3.461470 0.9293299 0.7545197\n", " variable\n", "1 653\n", "2 773,777\n", "3 362,365,372,373,374,379,381,383,384,386,387,388,389,391,392,396,397,398,399,400,401,403,404,405,407,408,415\n", "\n" ] } ], "source": [ "with (conversion_rules).context(): \n", " sumstats = susie.univariate_regression(\n", " N3[N3_names['X']],\n", " np.array(N3[N3_names['Y']])[:,0]\n", " )\n", " z_scores = np.array(sumstats[0])/np.array(sumstats[1])\n", " R = np.corrcoef(N3[N3_names['X']], rowvar=False)\n", " fitted_rss1 = susie.susie_rss(\n", " bhat=sumstats[0], \n", " shat=sumstats[1], \n", " R=R,\n", " n=n,\n", " var_y=np.var(np.array(N3[N3_names['Y']])[:,0]),\n", " L=10,\n", " estimate_residual_variance=True\n", " )\n", " print(ro.r.summary(fitted_rss1)[1])" ] }, { "cell_type": "code", "execution_count": 5, "id": "f933cfd4-d5a8-4c3c-a197-289c50cad29d", "metadata": {}, "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ "[1] TRUE\n", "\n" ] } ], "source": [ "with (conversion_rules).context(): \n", " fitted = susie.susie(N3[N3_names['X']], \n", " np.array(N3[N3_names['Y']])[:,0], \n", " L=10\n", " )\n", " print(ro.r['all.equal'](fitted[-2], fitted_rss1[-1]))" ] }, { 
"cell_type": "code", "execution_count": 6, "id": "7666219b-cd4f-4bbc-9ac1-e26a56953042", "metadata": {}, "outputs": [ { "name": "stderr", "output_type": "stream", "text": [ "R[write to console]: HINT: For estimate_residual_variance = TRUE, please check that R is the \"in-sample\" LD matrix; that is, the correlation matrix obtained using the exact same data matrix X that was used for the other summary statistics. Also note, when covariates are included in the univariate regressions that produced the summary statistics, also consider removing these effects from X before computing R.\n", "\n", "R[write to console]: WARNING: XtX is not symmetric; forcing XtX to be symmetric by replacing XtX with (XtX + t(XtX))/2\n", "\n", "R[write to console]: Error in Xty - s$XtXr : non-conformable arrays\n", "\n" ] }, { "ename": "RRuntimeError", "evalue": "Error in Xty - s$XtXr : non-conformable arrays\n", "output_type": "error", "traceback": [ "\u001b[0;31m---------------------------------------------------------------------------\u001b[0m", "\u001b[0;31mRRuntimeError\u001b[0m Traceback (most recent call last)", "Cell \u001b[0;32mIn[6], line 2\u001b[0m\n\u001b[1;32m 1\u001b[0m \u001b[38;5;28;01mwith\u001b[39;00m (conversion_rules)\u001b[38;5;241m.\u001b[39mcontext(): \n\u001b[0;32m----> 2\u001b[0m fitted_rss2 \u001b[38;5;241m=\u001b[39m \u001b[43msusie\u001b[49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43msusie_rss\u001b[49m\u001b[43m(\u001b[49m\n\u001b[1;32m 3\u001b[0m \u001b[43m \u001b[49m\u001b[43mz\u001b[49m\u001b[38;5;241;43m=\u001b[39;49m\u001b[43mz_scores\u001b[49m\u001b[43m,\u001b[49m\n\u001b[1;32m 4\u001b[0m \u001b[43m \u001b[49m\u001b[43mR\u001b[49m\u001b[38;5;241;43m=\u001b[39;49m\u001b[43mR\u001b[49m\u001b[43m,\u001b[49m\n\u001b[1;32m 5\u001b[0m \u001b[43m \u001b[49m\u001b[43mn\u001b[49m\u001b[38;5;241;43m=\u001b[39;49m\u001b[43mn\u001b[49m\u001b[43m,\u001b[49m\u001b[43m \u001b[49m\n\u001b[1;32m 6\u001b[0m \u001b[43m 
\u001b[49m\u001b[43mvar_y\u001b[49m\u001b[38;5;241;43m=\u001b[39;49m\u001b[43mnp\u001b[49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43mvar\u001b[49m\u001b[43m(\u001b[49m\u001b[43mnp\u001b[49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43marray\u001b[49m\u001b[43m(\u001b[49m\u001b[43mN3\u001b[49m\u001b[43m[\u001b[49m\u001b[43mN3_names\u001b[49m\u001b[43m[\u001b[49m\u001b[38;5;124;43m'\u001b[39;49m\u001b[38;5;124;43mY\u001b[39;49m\u001b[38;5;124;43m'\u001b[39;49m\u001b[43m]\u001b[49m\u001b[43m]\u001b[49m\u001b[43m)\u001b[49m\u001b[43m[\u001b[49m\u001b[43m:\u001b[49m\u001b[43m,\u001b[49m\u001b[38;5;241;43m0\u001b[39;49m\u001b[43m]\u001b[49m\u001b[43m)\u001b[49m\u001b[43m,\u001b[49m\n\u001b[1;32m 7\u001b[0m \u001b[43m \u001b[49m\u001b[43mL\u001b[49m\u001b[38;5;241;43m=\u001b[39;49m\u001b[38;5;241;43m10\u001b[39;49m\u001b[43m,\u001b[49m\n\u001b[1;32m 8\u001b[0m \u001b[43m \u001b[49m\u001b[43mestimate_residual_variance\u001b[49m\u001b[38;5;241;43m=\u001b[39;49m\u001b[38;5;28;43;01mTrue\u001b[39;49;00m\n\u001b[1;32m 9\u001b[0m \u001b[43m \u001b[49m\u001b[43m)\u001b[49m\n", "File \u001b[0;32m~/miniforge3/envs/susie_rpy2/lib/python3.12/site-packages/rpy2/robjects/functions.py:208\u001b[0m, in \u001b[0;36mSignatureTranslatedFunction.__call__\u001b[0;34m(self, *args, **kwargs)\u001b[0m\n\u001b[1;32m 206\u001b[0m v \u001b[38;5;241m=\u001b[39m kwargs\u001b[38;5;241m.\u001b[39mpop(k)\n\u001b[1;32m 207\u001b[0m kwargs[r_k] \u001b[38;5;241m=\u001b[39m v\n\u001b[0;32m--> 208\u001b[0m \u001b[38;5;28;01mreturn\u001b[39;00m (\u001b[38;5;28;43msuper\u001b[39;49m\u001b[43m(\u001b[49m\u001b[43mSignatureTranslatedFunction\u001b[49m\u001b[43m,\u001b[49m\u001b[43m \u001b[49m\u001b[38;5;28;43mself\u001b[39;49m\u001b[43m)\u001b[49m\n\u001b[1;32m 209\u001b[0m \u001b[43m \u001b[49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[38;5;21;43m__call__\u001b[39;49m\u001b[43m(\u001b[49m\u001b[38;5;241;43m*\u001b[39;49m\u001b[43margs\u001b[49m\u001b[43m,\u001b[49m\u001b[43m 
\u001b[49m\u001b[38;5;241;43m*\u001b[39;49m\u001b[38;5;241;43m*\u001b[39;49m\u001b[43mkwargs\u001b[49m\u001b[43m)\u001b[49m)\n", "File \u001b[0;32m~/miniforge3/envs/susie_rpy2/lib/python3.12/site-packages/rpy2/robjects/functions.py:131\u001b[0m, in \u001b[0;36mFunction.__call__\u001b[0;34m(self, *args, **kwargs)\u001b[0m\n\u001b[1;32m 129\u001b[0m \u001b[38;5;28;01melse\u001b[39;00m:\n\u001b[1;32m 130\u001b[0m new_kwargs[k] \u001b[38;5;241m=\u001b[39m cv\u001b[38;5;241m.\u001b[39mpy2rpy(v)\n\u001b[0;32m--> 131\u001b[0m res \u001b[38;5;241m=\u001b[39m \u001b[38;5;28;43msuper\u001b[39;49m\u001b[43m(\u001b[49m\u001b[43mFunction\u001b[49m\u001b[43m,\u001b[49m\u001b[43m \u001b[49m\u001b[38;5;28;43mself\u001b[39;49m\u001b[43m)\u001b[49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[38;5;21;43m__call__\u001b[39;49m\u001b[43m(\u001b[49m\u001b[38;5;241;43m*\u001b[39;49m\u001b[43mnew_args\u001b[49m\u001b[43m,\u001b[49m\u001b[43m \u001b[49m\u001b[38;5;241;43m*\u001b[39;49m\u001b[38;5;241;43m*\u001b[39;49m\u001b[43mnew_kwargs\u001b[49m\u001b[43m)\u001b[49m\n\u001b[1;32m 132\u001b[0m res \u001b[38;5;241m=\u001b[39m cv\u001b[38;5;241m.\u001b[39mrpy2py(res)\n\u001b[1;32m 133\u001b[0m \u001b[38;5;28;01mreturn\u001b[39;00m res\n", "File \u001b[0;32m~/miniforge3/envs/susie_rpy2/lib/python3.12/site-packages/rpy2/rinterface_lib/conversion.py:45\u001b[0m, in \u001b[0;36m_cdata_res_to_rinterface.._\u001b[0;34m(*args, **kwargs)\u001b[0m\n\u001b[1;32m 44\u001b[0m \u001b[38;5;28;01mdef\u001b[39;00m\u001b[38;5;250m \u001b[39m\u001b[38;5;21m_\u001b[39m(\u001b[38;5;241m*\u001b[39margs, \u001b[38;5;241m*\u001b[39m\u001b[38;5;241m*\u001b[39mkwargs):\n\u001b[0;32m---> 45\u001b[0m cdata \u001b[38;5;241m=\u001b[39m \u001b[43mfunction\u001b[49m\u001b[43m(\u001b[49m\u001b[38;5;241;43m*\u001b[39;49m\u001b[43margs\u001b[49m\u001b[43m,\u001b[49m\u001b[43m \u001b[49m\u001b[38;5;241;43m*\u001b[39;49m\u001b[38;5;241;43m*\u001b[39;49m\u001b[43mkwargs\u001b[49m\u001b[43m)\u001b[49m\n\u001b[1;32m 46\u001b[0m 
\u001b[38;5;66;03m# TODO: test cdata is of the expected CType\u001b[39;00m\n\u001b[1;32m 47\u001b[0m \u001b[38;5;28;01mreturn\u001b[39;00m _cdata_to_rinterface(cdata)\n", "File \u001b[0;32m~/miniforge3/envs/susie_rpy2/lib/python3.12/site-packages/rpy2/rinterface.py:890\u001b[0m, in \u001b[0;36mSexpClosure.__call__\u001b[0;34m(self, *args, **kwargs)\u001b[0m\n\u001b[1;32m 883\u001b[0m res \u001b[38;5;241m=\u001b[39m rmemory\u001b[38;5;241m.\u001b[39mprotect(\n\u001b[1;32m 884\u001b[0m openrlib\u001b[38;5;241m.\u001b[39mrlib\u001b[38;5;241m.\u001b[39mR_tryEval(\n\u001b[1;32m 885\u001b[0m call_r,\n\u001b[1;32m 886\u001b[0m call_context\u001b[38;5;241m.\u001b[39m__sexp__\u001b[38;5;241m.\u001b[39m_cdata,\n\u001b[1;32m 887\u001b[0m error_occured)\n\u001b[1;32m 888\u001b[0m )\n\u001b[1;32m 889\u001b[0m \u001b[38;5;28;01mif\u001b[39;00m error_occured[\u001b[38;5;241m0\u001b[39m]:\n\u001b[0;32m--> 890\u001b[0m \u001b[38;5;28;01mraise\u001b[39;00m embedded\u001b[38;5;241m.\u001b[39mRRuntimeError(_rinterface\u001b[38;5;241m.\u001b[39m_geterrmessage())\n\u001b[1;32m 891\u001b[0m \u001b[38;5;28;01mreturn\u001b[39;00m res\n", "\u001b[0;31mRRuntimeError\u001b[0m: Error in Xty - s$XtXr : non-conformable arrays\n" ] } ], "source": [ "with (conversion_rules).context(): \n", " fitted_rss2 = susie.susie_rss(\n", " z=z_scores,\n", " R=R,\n", " n=n, \n", " var_y=np.var(np.array(N3[N3_names['Y']])[:,0]),\n", " L=10,\n", " estimate_residual_variance=True\n", " )\n" ] }, { "cell_type": "code", "execution_count": 7, "id": "00063c8b-6af3-4d65-9314-4971264d0d08", "metadata": {}, "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ "R version 4.4.2 (2024-10-31)\n", "Platform: x86_64-conda-linux-gnu\n", "Running under: Red Hat Enterprise Linux 8.6 (Ootpa)\n", "\n", "Matrix products: default\n", "BLAS/LAPACK: /hpfs/userws/chiouj02/software/conda_envs/susie_rpy2/lib/libopenblasp-r0.3.29.so; LAPACK version 3.12.0\n", "\n", "locale:\n", " [1] LC_CTYPE=en_US.UTF-8 LC_NUMERIC=C \n", " 
[3] LC_TIME=en_US.UTF-8 LC_COLLATE=en_US.UTF-8 \n", " [5] LC_MONETARY=en_US.UTF-8 LC_MESSAGES=en_US.UTF-8 \n", " [7] LC_PAPER=en_US.UTF-8 LC_NAME=C \n", " [9] LC_ADDRESS=C LC_TELEPHONE=C \n", "[11] LC_MEASUREMENT=en_US.UTF-8 LC_IDENTIFICATION=C \n", "\n", "time zone: America/New_York\n", "tzcode source: system (glibc)\n", "\n", "attached base packages:\n", "[1] tools stats graphics grDevices utils datasets methods \n", "[8] base \n", "\n", "other attached packages:\n", "[1] susieR_0.12.35\n", "\n", "loaded via a namespace (and not attached):\n", " [1] crayon_1.5.3 mixsqp_0.3-54 vctrs_0.6.5 \n", " [4] cli_3.6.4 rlang_1.1.5 generics_0.1.3 \n", " [7] RcppZiggurat_0.1.6 RcppParallel_5.1.10 glue_1.8.0 \n", "[10] colorspace_2.1-1 plyr_1.8.9 scales_1.3.0 \n", "[13] grid_4.4.2 munsell_0.5.1 tibble_3.2.1 \n", "[16] lifecycle_1.0.4 compiler_4.4.2 dplyr_1.1.4 \n", "[19] irlba_2.3.5.1 Rcpp_1.0.14 pkgconfig_2.0.3 \n", "[22] Rfast_2.1.4 lattice_0.22-6 R6_2.6.1 \n", "[25] tidyselect_1.2.1 parallel_4.4.2 pillar_1.10.1 \n", "[28] magrittr_2.0.3 Matrix_1.7-2 gtable_0.3.6 \n", "[31] reshape_0.8.9 matrixStats_1.5.0 ggplot2_3.5.1 \n", "\n" ] } ], "source": [ "print(ro.r.sessionInfo())" ] } ], "metadata": { "kernelspec": { "display_name": "susie_rpy2", "language": "python", "name": "susie_rpy2" }, "language_info": { "codemirror_mode": { "name": "ipython", "version": 3 }, "file_extension": ".py", "mimetype": "text/x-python", "name": "python", "nbconvert_exporter": "python", "pygments_lexer": "ipython3", "version": "3.12.9" } }, "nbformat": 4, "nbformat_minor": 5 } ================================================ FILE: inst/code/python_example/environment.yml ================================================ name: susie_rpy2 channels: - conda-forge - defaults dependencies: - _libgcc_mutex=0.1=conda_forge - _openmp_mutex=4.5=2_gnu - _r-mutex=1.0.1=anacondar_1 - asttokens=3.0.0=pyhd8ed1ab_1 - binutils_impl_linux-64=2.43=h4bf12b8_4 - bwidget=1.10.1=ha770c72_0 - bzip2=1.0.8=h4bc722e_7 - 
c-ares=1.34.4=hb9d3cd8_0 - ca-certificates=2025.1.31=hbcca054_0 - cairo=1.18.2=h3394656_1 - comm=0.2.2=pyhd8ed1ab_1 - curl=8.12.1=h332b0f4_0 - debugpy=1.8.12=py312h2ec8cdc_0 - decorator=5.2.1=pyhd8ed1ab_0 - exceptiongroup=1.2.2=pyhd8ed1ab_1 - executing=2.1.0=pyhd8ed1ab_1 - font-ttf-dejavu-sans-mono=2.37=hab24e00_0 - font-ttf-inconsolata=3.000=h77eed37_0 - font-ttf-source-code-pro=2.038=h77eed37_0 - font-ttf-ubuntu=0.83=h77eed37_3 - fontconfig=2.15.0=h7e30c49_1 - fonts-conda-ecosystem=1=0 - fonts-conda-forge=1=0 - freetype=2.12.1=h267a509_2 - fribidi=1.0.10=h36c2ea0_0 - gcc_impl_linux-64=14.2.0=hdb7739f_2 - gfortran_impl_linux-64=14.2.0=h0ee6e4a_2 - graphite2=1.3.13=h59595ed_1003 - gsl=2.7=he838d99_0 - gxx_impl_linux-64=14.2.0=h2ead766_2 - harfbuzz=10.3.0=h76408a6_0 - icu=75.1=he02047a_0 - importlib-metadata=8.6.1=pyha770c72_0 - ipykernel=6.29.5=pyh3099207_0 - ipython=8.32.0=pyh907856f_0 - jedi=0.19.2=pyhd8ed1ab_1 - jupyter_client=8.6.3=pyhd8ed1ab_1 - jupyter_core=5.7.2=pyh31011fe_1 - kernel-headers_linux-64=3.10.0=he073ed8_18 - keyutils=1.6.1=h166bdaf_0 - krb5=1.21.3=h659f571_0 - ld_impl_linux-64=2.43=h712a8e2_4 - lerc=4.0.0=h27087fc_0 - libblas=3.9.0=31_h59b9bed_openblas - libcblas=3.9.0=31_he106b2a_openblas - libcurl=8.12.1=h332b0f4_0 - libdeflate=1.23=h4ddbbb0_0 - libedit=3.1.20250104=pl5321h7949ede_0 - libev=4.33=hd590300_2 - libexpat=2.6.4=h5888daf_0 - libffi=3.4.6=h2dba641_0 - libgcc=14.2.0=h767d61c_2 - libgcc-devel_linux-64=14.2.0=h9c4974d_102 - libgcc-ng=14.2.0=h69a702a_2 - libgfortran=14.2.0=h69a702a_2 - libgfortran-ng=14.2.0=h69a702a_2 - libgfortran5=14.2.0=hf1ad2bd_2 - libglib=2.82.2=h2ff4ddf_1 - libgomp=14.2.0=h767d61c_2 - libiconv=1.18=h4ce23a2_1 - libjpeg-turbo=3.0.0=hd590300_1 - liblapack=3.9.0=31_h7ac8fdf_openblas - liblzma=5.6.4=hb9d3cd8_0 - libnghttp2=1.64.0=h161d5f1_0 - libnsl=2.0.1=hd590300_0 - libopenblas=0.3.29=pthreads_h94d23a6_0 - libpng=1.6.47=h943b412_0 - libsanitizer=14.2.0=hed042b8_2 - libsodium=1.0.20=h4ab18f5_0 - 
libsqlite=3.49.1=hee588c1_1 - libssh2=1.11.1=hf672d98_0 - libstdcxx=14.2.0=h8f9b012_2 - libstdcxx-devel_linux-64=14.2.0=h9c4974d_102 - libstdcxx-ng=14.2.0=h4852527_2 - libtiff=4.7.0=hd9ff511_3 - libuuid=2.38.1=h0b41bf4_0 - libwebp-base=1.5.0=h851e524_0 - libxcb=1.17.0=h8a09558_0 - libxcrypt=4.4.36=hd590300_1 - libzlib=1.3.1=hb9d3cd8_2 - make=4.4.1=hb9d3cd8_2 - matplotlib-inline=0.1.7=pyhd8ed1ab_1 - ncurses=6.5=h2d0b736_3 - nest-asyncio=1.6.0=pyhd8ed1ab_1 - numpy=2.2.3=py312h72c5963_0 - openssl=3.4.1=h7b32b05_0 - packaging=24.2=pyhd8ed1ab_2 - pandas=2.2.3=py312hf9745cd_1 - pango=1.56.1=h861ebed_0 - parso=0.8.4=pyhd8ed1ab_1 - pcre2=10.44=hba22ea6_2 - pexpect=4.9.0=pyhd8ed1ab_1 - pickleshare=0.7.5=pyhd8ed1ab_1004 - pip=25.0.1=pyh8b19718_0 - pixman=0.44.2=h29eaf8c_0 - platformdirs=4.3.6=pyhd8ed1ab_1 - prompt-toolkit=3.0.50=pyha770c72_0 - psutil=6.1.1=py312h66e93f0_0 - pthread-stubs=0.4=hb9d3cd8_1002 - ptyprocess=0.7.0=pyhd8ed1ab_1 - pure_eval=0.2.3=pyhd8ed1ab_1 - pygments=2.19.1=pyhd8ed1ab_0 - python=3.12.9=h9e4cc4f_0_cpython - python-dateutil=2.9.0.post0=pyhff2d567_1 - python-tzdata=2025.1=pyhd8ed1ab_0 - python_abi=3.12=5_cp312 - pytz=2024.1=pyhd8ed1ab_0 - pyzmq=26.2.1=py312hbf22597_0 - r-base=4.4.2=hc737e89_2 - readline=8.2=h8c095d6_2 - sed=4.8=he412f7d_0 - setuptools=75.8.0=pyhff2d567_0 - six=1.17.0=pyhd8ed1ab_0 - stack_data=0.6.3=pyhd8ed1ab_1 - sysroot_linux-64=2.17=h0157908_18 - tk=8.6.13=noxft_h4845f30_101 - tktable=2.10=h8bc8fbc_6 - tornado=6.4.2=py312h66e93f0_0 - traitlets=5.14.3=pyhd8ed1ab_1 - typing_extensions=4.12.2=pyha770c72_1 - tzdata=2025a=h78e105d_0 - wcwidth=0.2.13=pyhd8ed1ab_1 - wheel=0.45.1=pyhd8ed1ab_1 - xorg-libice=1.1.2=hb9d3cd8_0 - xorg-libsm=1.2.5=he73a12e_0 - xorg-libx11=1.8.11=h4f16b4b_0 - xorg-libxau=1.0.12=hb9d3cd8_0 - xorg-libxdmcp=1.1.5=hb9d3cd8_0 - xorg-libxext=1.3.6=hb9d3cd8_0 - xorg-libxrender=0.9.12=hb9d3cd8_0 - xorg-libxt=1.3.1=hb9d3cd8_0 - zeromq=4.3.5=h3b0a872_7 - zipp=3.21.0=pyhd8ed1ab_1 - zstd=1.5.7=hb8e6e7a_1 - pip: - 
cffi==1.17.1 - jinja2==3.1.5 - markupsafe==3.0.2 - pycparser==2.22 - rpy2==3.5.17 - tzlocal==5.3 prefix: /home/chiouj02/miniforge3/envs/susie_rpy2 ================================================ FILE: inst/code/simulate_lambda_pop_ld_bias.R ================================================ #!/usr/bin/env Rscript # Simulate GTEx-like eQTL summary statistics from real-LD genotype matrices, # then compare in-sample, ADSP-like, and UKB-like LD references with and without # the population-bias correction. default_config <- list( input_dir = "/home/gw/Documents/susie_ash_test/chat_test", output_dir = "/home/gw/Documents/susie_ash_test/chat_test/lambda_pop_sim_results", susie_repo = "/home/gw/GIT/susieR", simxqtl_repo = "/home/gw/GIT/simxQTL", n_reps = 20L, seed = 20260501L, p_max = 2500L, n_ref = 500L, L = 10L, max_iter = 80L, coverage = 0.95, min_abs_corr = 0.5, ld_proxy_threshold = 0.8, h2g = 0.15, n_sparse = 3L, n_oligogenic = 0L, n_inf = 0L, prop_h2_sparse = 1.00, prop_h2_oligogenic = 0.00, prop_h2_infinitesimal = 0.00, adsp_delta = 0.02, ukb_delta = 0.35, lambda_zero_tol = 0.01, include_map_qc = TRUE, verbose_fit = FALSE, verbose_reps = 1L, smoke = FALSE ) vlog <- function(...) { msg <- paste0("[", format(Sys.time(), "%H:%M:%S"), "] ", ...) 
message(msg) flush.console() } parse_args <- function(defaults) { args <- commandArgs(trailingOnly = TRUE) cfg <- defaults if (!length(args)) { return(cfg) } for (arg in args) { if (!grepl("^--", arg)) { stop("Arguments must be --name=value; got: ", arg) } kv <- strsplit(sub("^--", "", arg), "=", fixed = TRUE)[[1]] key <- gsub("-", "_", kv[1]) value <- if (length(kv) > 1) paste(kv[-1], collapse = "=") else "TRUE" if (!key %in% names(cfg)) { stop("Unknown argument --", kv[1]) } old <- cfg[[key]] if (is.logical(old)) { cfg[[key]] <- tolower(value) %in% c("true", "t", "1", "yes", "y") } else if (is.integer(old)) { cfg[[key]] <- as.integer(value) } else if (is.numeric(old)) { cfg[[key]] <- as.numeric(value) } else { cfg[[key]] <- value } } if (isTRUE(cfg$smoke)) { cfg$n_reps <- min(cfg$n_reps, 1L) cfg$p_max <- min(cfg$p_max, 300L) cfg$n_ref <- min(cfg$n_ref, 200L) cfg$L <- min(cfg$L, 6L) cfg$max_iter <- min(cfg$max_iter, 20L) } cfg } load_local_packages <- function(cfg) { if (!requireNamespace("pkgload", quietly = TRUE)) { stop("Package 'pkgload' is required to load local susieR and simxQTL repos.") } pkgload::load_all(cfg$susie_repo, quiet = TRUE) pkgload::load_all(cfg$simxqtl_repo, quiet = TRUE) } write_json <- function(x, file) { if (requireNamespace("jsonlite", quietly = TRUE)) { jsonlite::write_json(x, file, pretty = TRUE, auto_unbox = TRUE, null = "null") } else { capture.output(str(x), file = file) } } standardize_matrix <- function(X) { X <- as.matrix(X) X <- scale(X, center = TRUE, scale = TRUE) X[is.na(X)] <- 0 storage.mode(X) <- "double" X } select_variant_window <- function(G, p_max, seed) { G <- as.matrix(G) p <- ncol(G) if (p <= p_max) { return(standardize_matrix(G)) } set.seed(seed) start <- sample.int(p - p_max + 1L, 1L) standardize_matrix(G[, start:(start + p_max - 1L), drop = FALSE]) } read_genotype_files <- function(input_dir) { files <- list.files(input_dir, pattern = "[.]rds$", recursive = TRUE, full.names = TRUE) ok <- logical(length(files)) dims 
<- vector("list", length(files)) for (i in seq_along(files)) { obj <- tryCatch(readRDS(files[i]), error = function(e) NULL) X <- if (!is.null(obj$G)) obj$G else obj$X ok[i] <- is.matrix(X) || is.data.frame(X) if (ok[i]) { dims[[i]] <- dim(X) } } data.frame( file = files[ok], n = vapply(dims[ok], `[`, numeric(1), 1L), p = vapply(dims[ok], `[`, numeric(1), 2L), stringsAsFactors = FALSE ) } make_reference_panel <- function(G, n_ref, delta, seed) { set.seed(seed) n <- nrow(G) idx <- sample.int(n, n_ref, replace = n_ref > n) X <- G[idx, , drop = FALSE] if (delta > 0) { E <- matrix(rnorm(n_ref * ncol(G)), n_ref, ncol(G)) X <- sqrt(1 - delta) * X + sqrt(delta) * E } standardize_matrix(X) } make_z_scores <- function(X, y) { z <- calc_z(X, y, center = TRUE, scale = FALSE) z[!is.finite(z)] <- 0 as.numeric(z) } fit_susie_rss <- function(z, X_ref, n_target, cfg, method, verbose_fit = FALSE) { R_mismatch <- switch(method, no_finite_no_bias = "none", finite_only = "none", bias_map = "map", bias_map_qc = "map_qc", stop("Unknown method: ", method)) R_finite <- switch(method, no_finite_no_bias = NULL, finite_only = TRUE, bias_map = TRUE, bias_map_qc = TRUE, stop("Unknown method: ", method)) args <- list( z = z, X = X_ref, n = n_target, L = cfg$L, coverage = cfg$coverage, min_abs_corr = cfg$min_abs_corr, max_iter = cfg$max_iter, R_finite = R_finite, R_mismatch = R_mismatch, estimate_residual_variance = FALSE, verbose = isTRUE(verbose_fit) ) if (isTRUE(verbose_fit)) { return(do.call(susie_rss, args)) } withCallingHandlers(do.call(susie_rss, args), message = function(m) invokeRestart("muffleMessage"), warning = function(w) invokeRestart("muffleWarning")) } extract_lambda_table <- function(fit, rep_id, panel, method) { diag <- fit$R_finite_diagnostics lb <- diag$lambda_bias if (is.null(lb)) { lb <- rep(NA_real_, nrow(fit$alpha)) } bc <- diag$B_corrected if (is.null(bc)) { bc <- rep(NA_real_, length(lb)) } data.frame( rep = rep_id, panel = panel, method = method, effect = seq_along(lb), 
R_finite_B = if (is.null(diag$B)) NA_real_ else as.numeric(diag$B), lambda_pop = as.numeric(lb), B_corrected = as.numeric(bc), stringsAsFactors = FALSE ) } max_abs_ld_to_causal <- function(X_target, idx, causal) { if (!length(idx) || !length(causal)) { return(0) } idx <- intersect(idx, seq_len(ncol(X_target))) causal <- intersect(causal, seq_len(ncol(X_target))) if (!length(idx) || !length(causal)) { return(0) } C <- crossprod(X_target[, idx, drop = FALSE], X_target[, causal, drop = FALSE]) / (nrow(X_target) - 1) max(abs(C)) } causal_detected_by_cs <- function(X_target, cs, causal, ld_threshold) { if (!length(cs) || !length(causal)) { return(integer(0)) } detected <- integer(0) for (j in causal) { if (j %in% cs) { detected <- c(detected, j) } else { C <- crossprod(X_target[, cs, drop = FALSE], X_target[, j, drop = FALSE]) / (nrow(X_target) - 1) if (max(abs(C)) >= ld_threshold) { detected <- c(detected, j) } } } unique(detected) } extract_cs_metrics <- function(fit, X_target, causal, rep_id, panel, method, ld_threshold) { cs_list <- fit$sets$cs if (is.null(cs_list) || !length(cs_list)) { return(data.frame( rep = rep_id, panel = panel, method = method, cs_name = NA_character_, cs_size = 0L, exact_hit = FALSE, proxy_hit = FALSE, max_abs_ld_to_causal = NA_real_, detected_causal = NA_character_, stringsAsFactors = FALSE )) } rows <- vector("list", length(cs_list)) for (i in seq_along(cs_list)) { cs <- as.integer(cs_list[[i]]) detected <- causal_detected_by_cs(X_target, cs, causal, ld_threshold) rows[[i]] <- data.frame( rep = rep_id, panel = panel, method = method, cs_name = names(cs_list)[i], cs_size = length(cs), exact_hit = any(cs %in% causal), proxy_hit = length(detected) > 0, max_abs_ld_to_causal = max_abs_ld_to_causal(X_target, cs, causal), detected_causal = paste(detected, collapse = ";"), stringsAsFactors = FALSE ) } do.call(rbind, rows) } summarize_fit <- function(fit, X_target, causal, rep_id, panel, method, elapsed, err = NULL, ld_threshold = 0.8) { if 
(!is.null(err)) { return(data.frame( rep = rep_id, panel = panel, method = method, status = "error", error = conditionMessage(err), elapsed_sec = elapsed, n_cs = NA_integer_, cs_tp_exact = NA_integer_, cs_tp_proxy = NA_integer_, cs_fp_proxy = NA_integer_, cs_fdr_proxy = NA_real_, causal_recall_proxy = NA_real_, top1_is_causal = NA, top1_ld_proxy = NA, max_pip_causal = NA_real_, mean_lambda_pop = NA_real_, max_lambda_pop = NA_real_, nonzero_lambda_pop = NA_integer_, R_finite_B = NA_real_, mean_B_corrected = NA_real_, max_per_variable_penalty = NA_real_, Q_art = NA_real_, artifact_flag = NA, mode_label = NA_character_, converged = NA, stringsAsFactors = FALSE )) } cs_rows <- extract_cs_metrics(fit, X_target, causal, rep_id, panel, method, ld_threshold) has_cs <- !all(is.na(cs_rows$cs_name)) detected <- integer(0) if (has_cs) { det_str <- cs_rows$detected_causal[nzchar(cs_rows$detected_causal)] detected <- unique(as.integer(unlist(strsplit(paste(det_str, collapse = ";"), ";", fixed = TRUE)))) detected <- detected[!is.na(detected)] } top1 <- which.max(fit$pip) diag <- fit$R_finite_diagnostics lb <- diag$lambda_bias penalty <- diag$per_variable_penalty data.frame( rep = rep_id, panel = panel, method = method, status = "ok", error = NA_character_, elapsed_sec = elapsed, n_cs = if (has_cs) nrow(cs_rows) else 0L, cs_tp_exact = if (has_cs) sum(cs_rows$exact_hit) else 0L, cs_tp_proxy = if (has_cs) sum(cs_rows$proxy_hit) else 0L, cs_fp_proxy = if (has_cs) sum(!cs_rows$proxy_hit) else 0L, cs_fdr_proxy = if (has_cs) mean(!cs_rows$proxy_hit) else NA_real_, causal_recall_proxy = length(intersect(detected, causal)) / length(causal), top1_is_causal = top1 %in% causal, top1_ld_proxy = max_abs_ld_to_causal(X_target, top1, causal) >= ld_threshold, max_pip_causal = max(fit$pip[causal]), R_finite_B = if (is.null(diag$B)) NA_real_ else as.numeric(diag$B), mean_lambda_pop = if (is.null(lb)) NA_real_ else mean(lb), max_lambda_pop = if (is.null(lb)) NA_real_ else max(lb), nonzero_lambda_pop 
= if (is.null(lb)) NA_integer_ else sum(lb > 0), mean_B_corrected = if (is.null(diag$B_corrected)) NA_real_ else mean(diag$B_corrected), max_per_variable_penalty = if (is.null(penalty)) NA_real_ else max(penalty), Q_art = if (is.null(diag$Q_art)) NA_real_ else diag$Q_art, artifact_flag = if (is.null(diag$artifact_flag)) NA else isTRUE(diag$artifact_flag), mode_label = if (is.null(diag$mode_label)) NA_character_ else as.character(diag$mode_label), converged = isTRUE(fit$converged), stringsAsFactors = FALSE ) } write_ai_readme <- function(cfg, out_dir) { lines <- c( "# Lambda-pop LD-bias simulation outputs", "", "Primary files for AI parsing:", "", "- `per_fit_metrics.csv`: one row per replicate, panel, and method. Key methods are `no_finite_no_bias`, `finite_only`, `bias_map`, and `bias_map_qc`; key columns are `R_finite_B`, `max_lambda_pop`, `mean_lambda_pop`, `mean_B_corrected`, `causal_recall_proxy`, `cs_fdr_proxy`, `top1_is_causal`, and `max_pip_causal`.", "- `per_effect_lambda.csv`: per-effect `R_finite_B`, `lambda_pop`, and `B_corrected` estimates.", "- `cs_metrics.csv`: one row per credible set, with exact and LD-proxy truth labels.", "- `replicate_metadata.csv`: source file, dimensions, causal indices, and realized h2.", "- `aggregate_summary.csv`: mean/median summaries grouped by panel and method.", "- `run_config.json`: exact simulation settings.", "", "Expected checks:", "", "1. In-sample LD with `method == bias_map` should have `lambda_pop` equal or very close to zero.", "2. `ADSP_like` should have smaller `lambda_pop` and larger `B_corrected` than `UKB_like`.", "3. 
`bias_map` should reduce false credible sets under biased LD without losing too much causal recall.", "", paste0("Configured ADSP delta = ", cfg$adsp_delta, "; UKB delta = ", cfg$ukb_delta, "; LD proxy threshold = ", cfg$ld_proxy_threshold, ".") ) writeLines(lines, file.path(out_dir, "AI_PARSE_ME.md")) } aggregate_metrics <- function(metrics) { ok <- metrics[metrics$status == "ok", , drop = FALSE] if (!nrow(ok)) { return(data.frame()) } groups <- unique(ok[, c("panel", "method")]) rows <- vector("list", nrow(groups)) for (i in seq_len(nrow(groups))) { idx <- ok$panel == groups$panel[i] & ok$method == groups$method[i] x <- ok[idx, , drop = FALSE] rows[[i]] <- data.frame( panel = groups$panel[i], method = groups$method[i], n_ok = nrow(x), mean_max_lambda_pop = mean(x$max_lambda_pop, na.rm = TRUE), median_max_lambda_pop = median(x$max_lambda_pop, na.rm = TRUE), mean_lambda_pop = mean(x$mean_lambda_pop, na.rm = TRUE), R_finite_B = mean(x$R_finite_B, na.rm = TRUE), mean_B_corrected = mean(x$mean_B_corrected, na.rm = TRUE), mean_causal_recall_proxy = mean(x$causal_recall_proxy, na.rm = TRUE), mean_cs_fdr_proxy = mean(x$cs_fdr_proxy, na.rm = TRUE), mean_n_cs = mean(x$n_cs, na.rm = TRUE), mean_max_pip_causal = mean(x$max_pip_causal, na.rm = TRUE), artifact_flag_rate = mean(x$artifact_flag, na.rm = TRUE), mean_Q_art = mean(x$Q_art, na.rm = TRUE), top1_causal_rate = mean(x$top1_is_causal, na.rm = TRUE), top1_proxy_rate = mean(x$top1_ld_proxy, na.rm = TRUE), stringsAsFactors = FALSE ) } do.call(rbind, rows) } metric_value <- function(metrics, rep_i, panel, method, column) { idx <- metrics$rep == rep_i & metrics$panel == panel & metrics$method == method if (!any(idx)) { return(NA_real_) } value <- metrics[idx, column][1] if (is.logical(value)) { return(as.numeric(value)) } as.numeric(value) } mean_metric <- function(metrics, panel, method, column) { idx <- metrics$status == "ok" & metrics$panel == panel & metrics$method == method if (!any(idx)) { return(NA_real_) } 
mean(as.numeric(metrics[idx, column]), na.rm = TRUE) } fmt_metric <- function(x, digits = 3) { if (!is.finite(x)) { return("NA") } formatC(x, format = "fg", digits = digits) } print_progress_line <- function(metrics, rep_i, cfg) { in_lambda <- metric_value(metrics, rep_i, "in_sample", "bias_map", "max_lambda_pop") adsp_lambda <- metric_value(metrics, rep_i, "ADSP_like", "bias_map", "max_lambda_pop") ukb_lambda <- metric_value(metrics, rep_i, "UKB_like", "bias_map", "max_lambda_pop") adsp_recall <- metric_value(metrics, rep_i, "ADSP_like", "bias_map", "causal_recall_proxy") ukb_recall <- metric_value(metrics, rep_i, "UKB_like", "bias_map", "causal_recall_proxy") adsp_fdr <- metric_value(metrics, rep_i, "ADSP_like", "bias_map", "cs_fdr_proxy") ukb_fdr <- metric_value(metrics, rep_i, "UKB_like", "bias_map", "cs_fdr_proxy") mean_in_lambda <- mean_metric(metrics, "in_sample", "bias_map", "max_lambda_pop") mean_adsp_lambda <- mean_metric(metrics, "ADSP_like", "bias_map", "max_lambda_pop") mean_ukb_lambda <- mean_metric(metrics, "UKB_like", "bias_map", "max_lambda_pop") mean_adsp_recall <- mean_metric(metrics, "ADSP_like", "bias_map", "causal_recall_proxy") mean_ukb_recall <- mean_metric(metrics, "UKB_like", "bias_map", "causal_recall_proxy") in_ok <- is.finite(in_lambda) && in_lambda <= cfg$lambda_zero_tol adsp_lt_ukb <- is.finite(adsp_lambda) && is.finite(ukb_lambda) && adsp_lambda < ukb_lambda mean_adsp_lt_ukb <- is.finite(mean_adsp_lambda) && is.finite(mean_ukb_lambda) && mean_adsp_lambda < mean_ukb_lambda message( "PROGRESS rep=", rep_i, " current: in_lambda=", fmt_metric(in_lambda), " in_zero=", in_ok, " ADSP_lambda=", fmt_metric(adsp_lambda), " UKB_lambda=", fmt_metric(ukb_lambda), " ADSP= 1L & causal <= ncol(X_target)] if (!length(causal)) { causal <- sort(unique(which(sim$beta != 0))) } vlog(" simulated y: h2g_real=", fmt_metric(sim$h2g), " causal=[", paste(causal, collapse = ","), "]") panels <- list( in_sample = X_target, ADSP_like = 
make_reference_panel(X_target, cfg$n_ref, cfg$adsp_delta, rep_seed + 11L), UKB_like = make_reference_panel(X_target, cfg$n_ref, cfg$ukb_delta, rep_seed + 23L) ) methods <- c("no_finite_no_bias", "finite_only", "bias_map") if (isTRUE(cfg$include_map_qc)) { methods <- c(methods, "bias_map_qc") } all_meta[[rep_i]] <- data.frame( rep = rep_i, source_file = chosen[rep_i], n_target = nrow(X_target), p = ncol(X_target), n_causal_sparse = length(causal), causal_sparse = paste(causal, collapse = ";"), h2g_realized = sim$h2g, h2_sparse_realized = sim$h2_sparse, h2_oligogenic_realized = sim$h2_oligogenic, h2_infinitesimal_realized = sim$h2_infinitesimal, stringsAsFactors = FALSE ) for (panel_name in names(panels)) { for (method in methods) { verbose_fit <- isTRUE(cfg$verbose_fit) && rep_i <= cfg$verbose_reps && method %in% c("bias_map", "bias_map_qc") if (verbose_fit) { message("VERBOSE_FIT_BEGIN rep=", rep_i, " panel=", panel_name, " method=", method) } res <- run_one_fit(z, panels[[panel_name]], nrow(X_target), cfg, method, rep_i, panel_name, X_target, causal, verbose_fit = verbose_fit) if (verbose_fit) { message("VERBOSE_FIT_END rep=", rep_i, " panel=", panel_name, " method=", method) } key <- paste(rep_i, panel_name, method, sep = "__") all_metrics[[key]] <- res$metric all_lambda[[key]] <- res$lambda all_cs[[key]] <- res$cs compact_fits[[key]] <- list( pip = if (!is.null(res$fit)) res$fit$pip else NULL, sets = if (!is.null(res$fit)) res$fit$sets else NULL, R_finite_diagnostics = if (!is.null(res$fit)) res$fit$R_finite_diagnostics else NULL ) } } metrics_so_far <- do.call(rbind, all_metrics) write.csv(metrics_so_far, file.path(cfg$output_dir, "per_fit_metrics.csv"), row.names = FALSE) write.csv(do.call(rbind, all_meta), file.path(cfg$output_dir, "replicate_metadata.csv"), row.names = FALSE) if (length(all_lambda)) { write.csv(do.call(rbind, all_lambda), file.path(cfg$output_dir, "per_effect_lambda.csv"), row.names = FALSE) } if (length(all_cs)) { write.csv(do.call(rbind, 
all_cs), file.path(cfg$output_dir, "cs_metrics.csv"), row.names = FALSE) } write.csv(aggregate_metrics(metrics_so_far), file.path(cfg$output_dir, "aggregate_summary.csv"), row.names = FALSE) print_progress_line(metrics_so_far, rep_i, cfg) } final_metrics <- do.call(rbind, all_metrics) final <- list( config = cfg, metrics = final_metrics, lambda = if (length(all_lambda)) do.call(rbind, all_lambda) else data.frame(), cs = if (length(all_cs)) do.call(rbind, all_cs) else data.frame(), metadata = do.call(rbind, all_meta), aggregate = aggregate_metrics(final_metrics), compact_fits = compact_fits ) saveRDS(final, file.path(cfg$output_dir, "all_results.rds")) write_json(list( completed_at = as.character(Sys.time()), output_dir = normalizePath(cfg$output_dir, mustWork = FALSE), n_reps_requested = cfg$n_reps, n_reps_completed = length(chosen), files = c("AI_PARSE_ME.md", "run_config.json", "genotype_file_index.csv", "replicate_metadata.csv", "per_fit_metrics.csv", "per_effect_lambda.csv", "cs_metrics.csv", "aggregate_summary.csv", "all_results.rds") ), file.path(cfg$output_dir, "manifest.json")) vlog("Done. Results written to: ", cfg$output_dir) } main() ================================================ FILE: inst/code/small_sim.R ================================================ # Small script to evaluate the NIG prior version of SuSiE in # simulated data sets. library(matrixStats) library(susieR) susie_version <- packageVersion("susieR") outfile <- paste0("small_sim_out_v",susie_version,".RData") print(outfile) N <- 250 n <- 40 geno <- readRDS("../datafiles/Thyroid.FMO2.1Mb.RDS")$X storage.mode(geno) <- "double" causal_snps <- vector("list",N) res_susie <- vector("list",N) res_susie_small <- vector("list",N) runtimes <- data.frame(susie = rep(0,N), susie_small = rep(0,N)) for (iter in 1:N) { cat(iter,"") set.seed(iter) # Subsample the genotypes. i <- sample(nrow(geno),n) X <- geno[i,] # Remove SNPs that show no variation in the subset. 
j <- which(colSds(X) > 0) X <- X[,j] # Simulate b and y. p <- ncol(X) b <- rep(0,p) names(b) <- colnames(X) p1 <- sample(3,1) j <- sample(p,p1) b[j] <- sample(c(-1,1),p1,replace = TRUE) e <- rnorm(n,sd = 0.1) y <- drop(X %*% b + e) y <- y/sd(y) causal_snps[[iter]] <- j # Run susie with normal prior. t0 <- proc.time() fit1 <- suppressMessages( susie(X,y,L = 10,standardize = FALSE,min_abs_corr = 0.5, estimate_prior_method = "EM",verbose = FALSE)) t1 <- proc.time() res_susie[[iter]] <- fit1[c("V","sets")] runtimes[iter,"susie"] <- (t1 - t0)["elapsed"] # Run susie with NIG prior. t0 <- proc.time() fit2 <- suppressMessages( susie(X,y,L = 10,standardize = FALSE,min_abs_corr = 0.5, estimate_residual_method = "NIG", estimate_prior_method = "EM",alpha0 = 0.1,beta0 = 0.1, verbose = FALSE)) t1 <- proc.time() res_susie_small[[iter]] <- fit2[c("V","sets")] runtimes[iter,"susie_small"] <- (t1 - t0)["elapsed"] } cat("\n") # Save the results. save(list = c("n","susie_version","causal_snps","res_susie", "res_susie_small","runtimes"), file = outfile) ================================================ FILE: inst/code/sparse_matrix_strategy.Rmd ================================================ --- title: "Sparse matrix multiplication strategy" author: "Kaiqian Zhang" date: "`r Sys.Date()`" output: rmarkdown::html_vignette vignette: > %\VignetteIndexEntry{Sparse vs. dense matrix operations} %\VignetteEngine{knitr::rmarkdown} %\VignetteEncoding{UTF-8} --- ```{r setup, include=FALSE} knitr::opts_chunk$set(collapse = TRUE,comment = "#",fig.width = 4.5, fig.height = 3,fig.align = "center", fig.cap = " ",dpi = 120) ``` ## Set up environment ```{r, warning=FALSE, message=FALSE} library(susieR) library(Matrix) library(microbenchmark) library(ggplot2) set.seed(1) ``` ## Goal Our intention is to use sparse matrix multiplications to help reduce computation time. ## General strategy Given a large sparse matrix `X`, we want to compute some matrix multiplications associated with a scaled $\tilde{X}$. 
We notice that after scaling, `X` becomes a dense matrix, so sparse matrix multiplication is no longer possible. We therefore construct formulae to apply sparse matrix multiplication first on a standardized `X`, since standardization does not affect its sparsity. Then we perform centering to get the same result. ## Types of matrix multiplications There are two types of matrix multiplications we want to investigate: + Compute $\tilde{X}b$, where $\tilde{X}$ is an n by p scaled matrix and $b$ is a p vector. + Compute $\tilde{X}^Ty$, where $\tilde{X}$ is an n by p scaled matrix and $y$ is an n vector. ## Results This strategy has a decent performance when computing both $\tilde{X}b$ and $\tilde{X}^Ty$, compared to simple matrix multiplication `%*%`. ## Strategy formulae details ### Computing $\boldsymbol{\tilde{X}b}$ Suppose we want to compute $\tilde{X}b$, where $\tilde{X}$ is a scaled n by p matrix and $b$ is a p vector. Our goal is to express $\tilde{X}b$ as a term involving unscaled $X$ matrix multiplication to achieve sparse matrix operation. \begin{equation} \begin{aligned} \tilde{X}b &= \sum_{j=1}^{p} \tilde{X}_{\cdot j} b_j \\ &= \sum_{j=1}^{p} \frac{X_{\cdot j}-\mu_j}{\sigma_j}b_j \\ &= \sum_{j=1}^{p}\frac{X_{\cdot j}}{\sigma_j}b_j - \sum_{j=1}^{p} \frac{\mu_j}{\sigma_j}b_j \\ &= X (b/\sigma) - \mu^\top (b/\sigma), \end{aligned} \end{equation} where $\mu$ is a *p*-vector of column means, $\sigma$ is a *p*-vector of column standard deviations, and the division $b/\sigma$ is elementwise. ### Computing $\boldsymbol{\tilde{X}^Ty}$ Suppose we want to compute $\tilde{X}^Ty$, where $\tilde{X}$ is a scaled n by p matrix and $y$ is an n vector. Similarly, we express $\tilde{X}^Ty$ using unscaled $X$ so that we can perform sparse matrix multiplication.
We have the following: \begin{equation} \begin{aligned} \tilde{X}^Ty &= \sum_{i=1}^{n} \tilde{X}_{i.}y_i \\ &= \sum_{i=1}^{n} \frac{X_{i.} - \mu}{\sigma}y_i \\ &= \frac{1}{\sigma}\sum_{i=1}^{n}X_{i.}y_i - \frac{\mu}{\sigma}\sum_{i=1}^{n} y_i \\ &= \frac{1}{\sigma}(X^Ty) - \frac{\mu}{\sigma}y^T 1, \end{aligned} \end{equation} where $\mu$ is a *p*-vector of column means, and $\sigma$ is a *p*-vector of column standard deviations. ## Simulations We simulate an `n = 1000` by `p = 10000` matrix `X` at sparsity $99\%$, i.e. $99\%$ of the entries are zeros. We compare results between normal matrix computation and our sparse strategy as well as comparing speed using microbenchmark. ```{r} create_sparsity_mat <- function(sparsity, n, p) { nonzero <- round(n*p*(1-sparsity)) nonzero.idx <- sample(n*p, nonzero) mat <- numeric(n*p) mat[nonzero.idx] <- 1 mat <- matrix(mat, nrow=n,ncol=p) return(mat) } n <- 1000 p <- 10000 ``` ```{r} X.dense <- create_sparsity_mat(0.99,n,p) X.sparse <- as(X.dense,"sparseMatrix") X.tilde <- susieR:::set_X_attributes(X.dense) #returns a scaled X if input is a dense matrix X <- susieR:::set_X_attributes(X.sparse) #returns an unscaled sparse X if input is a sparse matrix #but computes column means and standard deviations ``` ```{r} b <- rnorm(p) y <- rnorm(n) ``` ### Benchmark for computing $\boldsymbol{\tilde{X}b}$ The final results of the two methods when computing $\tilde{X}b$ are very close. ```{r} res1 <- X.tilde %*% b res2 <- susieR:::compute_Xb(X,b) max(abs(res1 - res2)) ``` ```{r} compute_Xb_benchmark <- microbenchmark( dense = (use.normal.Xb <- X.tilde%*%b), sparse = (use.sparse.Xb <- susieR:::compute_Xb(X,b)), times = 20,unit = "s") ``` Our sparse strategy demonstrates an obvious advantage over the normal matrix multiplication in computing $\tilde{X}b$. ```{r} autoplot(compute_Xb_benchmark) ``` ### Benchmark for computing $\boldsymbol{\tilde{X}^Ty}$ The final results of the two methods when computing $\tilde{X}^Ty$ are almost the same.
```{r} res3 <- t(X.tilde) %*% y res4 <- susieR:::compute_Xty(X,y) max(abs(res3 - res4)) ``` ```{r} compute_Xty_benchmark = microbenchmark( dense = (use.normal.Xty <- t(X.tilde)%*%y), sparse = (use.sparse.Xty <- susieR:::compute_Xty(X, y)), times = 20,unit = "s") ``` Our sparse strategy evidently has a better performance than the normal method in computing $\tilde{X}^Ty$. ```{r} autoplot(compute_Xty_benchmark) ``` ================================================ FILE: inst/code/summarize_small_sim.R ================================================ # Script to summarize the results of running small_sim.R. library(ggplot2) library(cowplot) load("../datafiles/small_sim_out_v0.14.48.RData") runtimes <- data.frame(susie = runtimes$susie, susie_ss = runtimes$susie_small) methods <- c("susie","susie_ss") # Summarize coverage, power and running times. N <- length(causal_snps) power <- c(0,0) coverage <- c(0,0) names(power) <- methods names(coverage) <- methods V1_true <- NULL V2_true <- NULL V1_false <- NULL V2_false <- NULL for (i in 1:N) { get_tp <- function (cs) { if (length(cs) == 0) return(NULL) else return(names(which(sapply(cs, function (x) length(intersect(causal_snps[[i]],x))>0)))) } V1 <- res_susie[[i]]$V V2 <- res_susie_small[[i]]$V all_cs <- paste0("L",1:10) names(V1) <- all_cs names(V2) <- all_cs x1 <- get_tp(res_susie[[i]]$sets$cs) x2 <- get_tp(res_susie_small[[i]]$sets$cs) V1_true <- c(V1_true,V1[x1]) V2_true <- c(V2_true,V2[x2]) V1_false <- c(V1_false,V1[setdiff(all_cs,x1)]) V2_false <- c(V2_false,V2[setdiff(all_cs,x2)]) power["susie"] <- power["susie"] + length(x1) power["susie_ss"] <- power["susie_ss"] + length(x2) coverage["susie"] <- coverage["susie"] + length(x1) coverage["susie_ss"] <- coverage["susie_ss"] + length(x2) } num_causal <- sum(sapply(causal_snps,length)) num_susie <- sum(sapply(res_susie,function (x) length(x$sets$cs))) num_susie_ss <- sum(sapply(res_susie_small,function (x) length(x$sets$cs))) power <- power / num_causal coverage["susie"] 
<- coverage["susie"] / num_susie coverage["susie_ss"] <- coverage["susie_ss"] / num_susie_ss cat("power:\n") print(power) cat("coverage:\n") print(coverage) cat("running times:\n") print(summary(runtimes)) # Summarize the CS sizes. get_cs_sizes <- function (res) unlist(lapply(res,function (x) sapply(x$sets$cs,length))) sizes_susie <- get_cs_sizes(res_susie) sizes_susie_ss <- get_cs_sizes(res_susie_small) cat("median CS size:\n") cat("susie =",median(sizes_susie),"\n") cat("susie_ss =",median(sizes_susie_ss),"\n") pdat <- rbind(data.frame(method = "susie", size = sizes_susie), data.frame(method = "susie_ss",size = sizes_susie_ss)) pdat <- subset(pdat,size <= 50) p1 <- ggplot(pdat,aes(x = size,fill = method)) + geom_histogram(color = "white",position = "dodge",bins = 16) + scale_fill_manual(values = c("darkblue","dodgerblue","darkorange")) + labs(x = "CS size",y = "number of CSs",fill = "") + theme_cowplot(font_size = 10) + theme(legend.position = "bottom", legend.direction = "vertical") ggsave("small_sim_sizes.pdf",p1,height = 3,width = 3) # Summarize the prior variances. 
pdat <- rbind(data.frame(method = "susie", causal = TRUE, V = V1_true), data.frame(method = "susie", causal = FALSE,V = V1_false), data.frame(method = "susie_ss",causal = TRUE, V = V2_true), data.frame(method = "susie_ss",causal = FALSE,V = V2_false)) pdat <- transform(pdat,sigma = sqrt(V)) pdat <- subset(pdat,sigma < 2) p2 <- ggplot(pdat,aes(x = sigma,color = causal,fill = causal)) + facet_grid(rows = vars(method),scales = "free_y") + geom_histogram(bins = 24,position = "dodge",linewidth = 0.05) + scale_color_manual(values = c("darkblue","orangered")) + scale_fill_manual(values = c("darkblue","orangered")) + labs(x = "prior s.d.") + theme_cowplot(font_size = 10) ggsave("small_sim_V.pdf",p2,height = 3.5,width = 3) ================================================ FILE: inst/code/susie_memory.R ================================================ # export MEM_CHECK_INTERVAL=0.01 # python3 monitor_memory.py Rscript susie_memory.R # # NOTES: # # - Without any improvements: # Size of X: 1 GB # max rss_memory: 4.70 GB # # - With the improvements: # Size of X: 1 GB # max rss_memory: 3.00 GB # # set.seed(1) # p <- 16000 # n <- 8000 # X <- matrix(rnorm(n*p),n,p) # X <- scale(X,center = TRUE,scale = TRUE) # y <- rnorm(n) # save(list = c("X","y"),file = "susie_data.RData") # library(susieR) devtools::load_all() load("susie_data.RData") cat("Size of X:\n") print(object.size(X),unit = "GB") cat("Running susie.\n") set.seed(1) out <- susie(X,y,estimate_prior_variance = FALSE,min_abs_corr = 0, verbose = TRUE) print(sapply(out$sets$cs,length)) ================================================ FILE: inst/code/susie_rss_memory.R ================================================ # export MEM_CHECK_INTERVAL=0.01 # python3 monitor_memory.py Rscript susie_rss_memory.R # # NOTES: # # - Without any improvements: # Size of X: 0.5 GB # max rss_memory: 4.15 GB # # - With some improvements, the initial steps right before the main # loop use 0.86 GB. 
# # - susie_rss right before the CS and PIP calculations uses 1.6 GB. # # library(susieR) devtools::load_all() # set.seed(1) # p <- 8000 # n <- 1000 # X <- matrix(rnorm(n*p),n,p) # y <- rnorm(n) # ss <- susieR:::univariate_regression(X,y) # z <- ss$betahat/ss$sebetahat # R <- cor(X) # save(list = c("X","y","z","R"),file = "susie_rss_data.RData") load("susie_rss_data.RData") cat("Size of R:\n") print(object.size(R),unit = "GB") cat("Running susie_rss.\n") set.seed(1) out <- susie_rss(z,R,estimate_prior_variance = FALSE,min_abs_corr = 0, check_input = FALSE,refine = FALSE,verbose = TRUE) print(sapply(out$sets$cs,length)) ================================================ FILE: inst/misc/README_susie_v2.md ================================================ # susieR 2.0 Architecture ## Overview susieR 2.0 implements a unified architecture incorporating various extensions to the Sum of Single Effects model for Bayesian variable selection regression. The package supports multiple data types (individual-level, sufficient statistics, regression summary statistics) through a single algorithmic pipeline using S3 method dispatch. 
## Architecture Diagram ``` Interface → Constructor → Workhorse → IBSS Core → Backend Methods ↓ ↓ (data, params) → model ``` ## Core Object Definitions The architecture revolves around three key objects: ### **Data Object** - **Purpose**: Contains input data in processed, algorithm-ready form - **S3 Classes**: `individual`, `ss`, `rss_lambda` (determines method dispatch) - **Mutability**: Immutable - never modified after creation - **Contents**: - Input matrices: X/y (individual), XtX/Xty/yty (ss), z/R (rss_lambda) - Metadata: n, p - Scaling attributes: For compute_Xb() compatibility - Specialized fields: Eigen decomposition for unmappable effects/rss_lambda ### **Params Object** - **Purpose**: Contains ALL algorithm parameters and user settings - **Mutability**: Immutable - never modified after validation - **Contents**: - Algorithm parameters: L, max_iter, tol, convergence_method - Estimation settings: estimate_prior_method, estimate_residual_method - Model options: unmappable_effects, refine, standardize, intercept ### **Model Object** - **Purpose**: Contains fitted SuSiE model state, results, and algorithm outputs - **Mutability**: Mutable - updated throughout fitting process - **Contents**: - Model matrices: alpha, mu, mu2, V, sigma2 - Fitted values: Xr (individual), XtXr (ss), Rz (rss_lambda) - Algorithm outputs: ELBO, niter, converged - Final results: credible sets, PIPs, intercept, z-scores ## Constructor Pattern ### **Constructor Workflow**: 1. **Interface functions** (`susie()`, `susie_ss()`, and `susie_rss()`) take user inputs and call constructor functions 2. **Constructors** create validated (data, params) objects 3.
**Workhorse**: Validated (data, params) objects are forwarded directly to the workhorse function for the main SuSiE algorithm ### **Constructor Functions** (`susie_constructors.R`): - `individual_data_constructor()` → Processes X, y matrices → (data, params) - `sufficient_stats_constructor()`→ Processes XtX, Xty, yty → (data, params) - `summary_stats_constructor()`: Routes RSS inputs based on lambda parameter - If `lambda = 0` → Converts RSS data to SS → `sufficient_stats_constructor()` → (data, params) - If `lambda > 0` → `rss_lambda_constructor()`→ Processes z, R for regularized LD → (data, params) ### **Data Type Support**: Each data object receives an S3 class that automatically routes it to the appropriate backend functions. - **`individual`**: Individual-level data (X, y matrices) - **`ss`**: Sufficient statistics (XtX, Xty, yty, n) - **`rss_lambda`**: RSS with regularized LD matrix (z, R, lambda > 0) ## Model Components ### Core Algorithm Files: 1. **`susie_workhorse.R`**: Main orchestration layer - Manages the complete fitting pipeline: initialize → iterate → finalize - Coordinates variance component updates - Handles convergence checking based on specified method - Tracks fit history when `track_fit=TRUE` 2. **`iterative_bayesian_stepwise_selection.R`**: IBSS algorithm - `ibss_initialize()`: Creates initial model state with L effects - `ibss_fit()`: Main iteration loop that updates each effect sequentially - `ibss_finalize()`: Post-processing to compute credible sets and PIPs 3.
**`single_effect_regression.R`**: Single Effect Regression (SER) implementation - `single_effect_regression()`: Fits one sparse effect at a time - `optimize_prior_variance()`: Optimizes the prior variance for the lth effect - `single_effect_update()`: Implements the complete SER update pipeline ## Backend Method Implementations Each data type has a corresponding backend file implementing the S3 methods defined in `generic_methods.R`: - `individual_data_methods.R` - Methods for class `individual` - `sufficient_stats_methods.R` - Methods for class `ss` - `rss_lambda_methods.R` - Methods for class `rss_lambda` The backend system allows the same high-level algorithm to work with different data representations through S3 method dispatch. Each backend file contains a 1:1 correspondence with the generic methods, implementing data-specific computations. ## Utility Functions - **`susie_utils.R`**: Internal utility functions organized by: - **Fundamental Building Blocks** (general-purpose helpers, matrix operations) - **Data Processing & Validation** (input validation, data conversion) - **Model Initialization** (set up model state) - **Core Algorithm Components** (posterior mean calculation, lbf calculation) - **Variance Estimation** (residual variance and unmappable effects variance estimation) - **Convergence & Optimization** (Convergence checking, ELBO computation) - **Credible Sets & Post-processing** (Generate credible sets, pips) - **`susie_rss_utils.R`**: Internal utility functions specific to RSS data with lambda > 0, organized by: - **Fundamental Computations** (core RSS computations) - **RSS Model Methods** (lambda estimation, precomputations) - **Diagnostic & Quality Control** (detect allele switch) - **`susie_get_functions.R`**: Exported accessor functions for extracting results: - `susie_get_cs()`: Extract credible sets - `susie_get_pip()`: Extract posterior inclusion probabilities - Other accessor functions for model components
================================================ FILE: inst/misc/format_r_code.sh ================================================ #!/bin/bash # Function to display error messages and exit the script display_error() { echo "Error: $1" exit 1 } # Check if the R file is provided as an argument if [ $# -eq 0 ]; then display_error "Please provide the path to the R file as an argument." fi # Get the R file path from the argument r_file="$1" # Check if the R file exists if [ ! -f "$r_file" ]; then display_error "The specified R file '$r_file' does not exist." fi echo "Formatting R code in file: $r_file" # Format the R code using formatR and capture the output # output=$(echo "library(formatR); tryCatch(tidy_source(\"$r_file\", file = \"$r_file\", indent = 2, args.newline = TRUE, arrow = TRUE), error = function(e) {message(\"Error formatting R code:\"); print(e)})" | R --slave --no-save 2>&1) # Format the R code using styler and capture the output output=$(echo "tryCatch(styler::style_file(\"$r_file\"), error = function(e) {message(\"Error formatting R code:\"); print(e)})" | R --slave --no-save 2>&1) # Check if the formatting was successful if echo "$output" | grep -q "Error formatting R code:"; then echo "Formatting failed. Please check the R code for syntax errors." echo -e "\033[0;31m$(echo "$output" | head -n -3)\033[0m" echo -e "\033[1;31m$(echo "$output" | tail -n 3)\033[0m" exit 1 else echo "R code formatting completed successfully." fi ================================================ FILE: inst/misc/post-commit.sh ================================================ #!/bin/bash # # This script will be executed every time you run "git commit". It # will commit changes made to package DESCRIPTION by the pre-commit hook # # To use this script, copy it to the .git/hooks directory of your # local repository to filename `post-commit`, and make it executable. 
# ROOT_DIR=`git rev-parse --show-toplevel` # Only commit DESCRIPTION file when it is not staged (due to changes by pre-commit hook) if [[ -z `git diff HEAD` ]] || [[ ! -f $ROOT_DIR/DESCRIPTION ]] || [[ -z `git diff $ROOT_DIR/DESCRIPTION` ]]; then exit 0 else git add $ROOT_DIR/DESCRIPTION git commit --amend -C HEAD --no-verify echo "Amend current commit to incorporate version bump" exit 0 fi ================================================ FILE: inst/misc/pre-commit.sh ================================================ #!/bin/bash # # This script will be executed every time you run "git commit". It # will update the 4th digit of package version by revision number. # # To use this script, copy it to the .git/hooks directory of your # local repository to filename `pre-commit`, and make it executable. # ROOT_DIR=`git rev-parse --show-toplevel` MSG="[WARNING] Auto-versioning disabled because string 'Version: x.y.z.r' cannot be found in DESCRIPTION file." GREP_REGEX='^Version: [0-9]*\.[0-9]*\.[0-9]*\.[0-9]*' SED_REGEX='^Version: \([0-9]*\.[0-9]*\.[0-9]*\)\.[0-9]*' # `git diff HEAD` shows both staged and unstaged changes if [[ -z `git diff HEAD` ]] || [[ ! -f $ROOT_DIR/DESCRIPTION ]]; then exit 0 elif [[ -z `grep "$GREP_REGEX" $ROOT_DIR/DESCRIPTION` ]]; then echo -e "\e[1;31m$MSG\e[0m" exit 0 else REV_ID=`git log --oneline | wc -l` REV_ID=`printf "%04d\n" $((REV_ID+1))` DATE=`date +%Y-%m-%d` echo "Version string bumped to revision $REV_ID on $DATE" sed -i "s/$SED_REGEX/Version: \1.$REV_ID/" $ROOT_DIR/DESCRIPTION sed -i "s/^Date: .*/Date: $DATE/" $ROOT_DIR/DESCRIPTION if [[ `git rev-parse --abbrev-ref HEAD` -eq "master" ]]; then cd $ROOT_DIR echo "Updating documentation ..." R --slave -e 'devtools::document()' &> /dev/null && git add man/*.Rd echo "Documentation updated!" echo "Running unit tests ..." R --slave -e 'devtools::test()' echo "Unit test completed!" 
fi exit 0 fi ================================================ FILE: inst/misc/uncrustify_default.cfg ================================================ # Downloaded from https://raw.githubusercontent.com/uncrustify/uncrustify/refs/heads/master/documentation/htdocs/default.cfg # By Gao Wang on Jan 17, 2025 # with modifications to `align_func_params_span` # usage: uncrustify -c /path/to/mashr/inst/misc/uncrustify_default.cfg --replace --no-backup -l CPP $f # Uncrustify-0.80.1 # # General options # # The type of line endings. # # Default: auto newlines = auto # lf/crlf/cr/auto # The original size of tabs in the input. # # Default: 8 input_tab_size = 8 # unsigned number # The size of tabs in the output (only used if align_with_tabs=true). # # Default: 8 output_tab_size = 8 # unsigned number # The ASCII value of the string escape char, usually 92 (\) or (Pawn) 94 (^). # # Default: 92 string_escape_char = 92 # unsigned number # Alternate string escape char (usually only used for Pawn). # Only works right before the quote char. string_escape_char2 = 0 # unsigned number # Replace tab characters found in string literals with the escape sequence \t # instead. string_replace_tab_chars = false # true/false # Allow interpreting '>=' and '>>=' as part of a template in code like # 'void f(list>=val);'. If true, 'assert(x<0 && y>=3)' will be broken. # Improvements to template detection may make this option obsolete. tok_split_gte = false # true/false # Disable formatting of NL_CONT ('\\n') ended lines (e.g. multi-line macros). disable_processing_nl_cont = false # true/false # Specify the marker used in comments to disable processing of part of the # file. # # Default: *INDENT-OFF* disable_processing_cmt = " *INDENT-OFF*" # string # Specify the marker used in comments to (re)enable processing in a file. # # Default: *INDENT-ON* enable_processing_cmt = " *INDENT-ON*" # string # Enable parsing of digraphs. 
enable_digraphs = false # true/false # Option to allow both disable_processing_cmt and enable_processing_cmt # strings, if specified, to be interpreted as ECMAScript regular expressions. # If true, a regex search will be performed within comments according to the # specified patterns in order to disable/enable processing. processing_cmt_as_regex = false # true/false # Add or remove the UTF-8 BOM (recommend 'remove'). utf8_bom = ignore # ignore/add/remove/force # If the file contains bytes with values between 128 and 255, but is not # UTF-8, then output as UTF-8. utf8_byte = false # true/false # Force the output encoding to UTF-8. utf8_force = false # true/false # # Spacing options # # Add or remove space around non-assignment symbolic operators ('+', '/', '%', # '<<', and so forth). sp_arith = ignore # ignore/add/remove/force # Add or remove space around arithmetic operators '+' and '-'. # # Overrides sp_arith. sp_arith_additive = ignore # ignore/add/remove/force # Add or remove space around assignment operator '=', '+=', etc. sp_assign = ignore # ignore/add/remove/force # Add or remove space around '=' in C++11 lambda capture specifications. # # Overrides sp_assign. sp_cpp_lambda_assign = ignore # ignore/add/remove/force # Add or remove space after the capture specification of a C++11 lambda when # an argument list is present, as in '[] (int x){ ... }'. sp_cpp_lambda_square_paren = ignore # ignore/add/remove/force # Add or remove space after the capture specification of a C++11 lambda with # no argument list is present, as in '[] { ... }'. sp_cpp_lambda_square_brace = ignore # ignore/add/remove/force # Add or remove space after the opening parenthesis and before the closing # parenthesis of a argument list of a C++11 lambda, as in # '[]( ){ ... }' # with an empty list. 
sp_cpp_lambda_argument_list_empty = ignore # ignore/add/remove/force # Add or remove space after the opening parenthesis and before the closing # parenthesis of a argument list of a C++11 lambda, as in # '[]( int x ){ ... }'. sp_cpp_lambda_argument_list = ignore # ignore/add/remove/force # Add or remove space after the argument list of a C++11 lambda, as in # '[](int x) { ... }'. sp_cpp_lambda_paren_brace = ignore # ignore/add/remove/force # Add or remove space between a lambda body and its call operator of an # immediately invoked lambda, as in '[]( ... ){ ... } ( ... )'. sp_cpp_lambda_fparen = ignore # ignore/add/remove/force # Add or remove space around assignment operator '=' in a prototype. # # If set to ignore, use sp_assign. sp_assign_default = ignore # ignore/add/remove/force # Add or remove space before assignment operator '=', '+=', etc. # # Overrides sp_assign. sp_before_assign = ignore # ignore/add/remove/force # Add or remove space after assignment operator '=', '+=', etc. # # Overrides sp_assign. sp_after_assign = ignore # ignore/add/remove/force # Add or remove space in 'enum {'. # # Default: add sp_enum_brace = add # ignore/add/remove/force # Add or remove space in 'NS_ENUM ('. sp_enum_paren = ignore # ignore/add/remove/force # Add or remove space around assignment '=' in enum. sp_enum_assign = ignore # ignore/add/remove/force # Add or remove space before assignment '=' in enum. # # Overrides sp_enum_assign. sp_enum_before_assign = ignore # ignore/add/remove/force # Add or remove space after assignment '=' in enum. # # Overrides sp_enum_assign. sp_enum_after_assign = ignore # ignore/add/remove/force # Add or remove space around assignment ':' in enum. sp_enum_colon = ignore # ignore/add/remove/force # Add or remove space around preprocessor '##' concatenation operator. # # Default: add sp_pp_concat = add # ignore/add/remove/force # Add or remove space after preprocessor '#' stringify operator. # Also affects the '#@' charizing operator. 
sp_pp_stringify = ignore # ignore/add/remove/force # Add or remove space before preprocessor '#' stringify operator # as in '#define x(y) L#y'. sp_before_pp_stringify = ignore # ignore/add/remove/force # Add or remove space around boolean operators '&&' and '||'. sp_bool = ignore # ignore/add/remove/force # Add or remove space around compare operator '<', '>', '==', etc. sp_compare = ignore # ignore/add/remove/force # Add or remove space inside '(' and ')'. sp_inside_paren = ignore # ignore/add/remove/force # Add or remove space between nested parentheses, i.e. '((' vs. ') )'. sp_paren_paren = ignore # ignore/add/remove/force # Add or remove space between back-to-back parentheses, i.e. ')(' vs. ') ('. sp_cparen_oparen = ignore # ignore/add/remove/force # Add or remove space between ')' and '{'. sp_paren_brace = ignore # ignore/add/remove/force # Add or remove space between nested braces, i.e. '{{' vs. '{ {'. sp_brace_brace = ignore # ignore/add/remove/force # Add or remove space before pointer star '*'. sp_before_ptr_star = ignore # ignore/add/remove/force # Add or remove space before pointer star '*' that isn't followed by a # variable name. If set to ignore, sp_before_ptr_star is used instead. sp_before_unnamed_ptr_star = ignore # ignore/add/remove/force # Add or remove space before pointer star '*' that is followed by a qualifier. # If set to ignore, sp_before_unnamed_ptr_star is used instead. sp_before_qualifier_ptr_star = ignore # ignore/add/remove/force # Add or remove space before pointer star '*' that is followed by 'operator' keyword. # If set to ignore, sp_before_unnamed_ptr_star is used instead. sp_before_operator_ptr_star = ignore # ignore/add/remove/force # Add or remove space before pointer star '*' that is followed by # a class scope (as in 'int *MyClass::method()') or namespace scope # (as in 'int *my_ns::func()'). # If set to ignore, sp_before_unnamed_ptr_star is used instead. 
sp_before_scope_ptr_star = ignore # ignore/add/remove/force # Add or remove space before pointer star '*' that is followed by '::', # as in 'int *::func()'. # If set to ignore, sp_before_unnamed_ptr_star is used instead. sp_before_global_scope_ptr_star = ignore # ignore/add/remove/force # Add or remove space between a qualifier and a pointer star '*' that isn't # followed by a variable name, as in '(char const *)'. If set to ignore, # sp_before_ptr_star is used instead. sp_qualifier_unnamed_ptr_star = ignore # ignore/add/remove/force # Add or remove space between pointer stars '*', as in 'int ***a;'. sp_between_ptr_star = ignore # ignore/add/remove/force # Add or remove space between pointer star '*' and reference '&', as in 'int *& a;'. sp_between_ptr_ref = ignore # ignore/add/remove/force # Add or remove space after pointer star '*', if followed by a word. # # Overrides sp_type_func. sp_after_ptr_star = ignore # ignore/add/remove/force # Add or remove space after pointer caret '^', if followed by a word. sp_after_ptr_block_caret = ignore # ignore/add/remove/force # Add or remove space after pointer star '*', if followed by a qualifier. sp_after_ptr_star_qualifier = ignore # ignore/add/remove/force # Add or remove space after a pointer star '*', if followed by a function # prototype or function definition. # # Overrides sp_after_ptr_star and sp_type_func. sp_after_ptr_star_func = ignore # ignore/add/remove/force # Add or remove space after a pointer star '*' in the trailing return of a # function prototype or function definition. sp_after_ptr_star_trailing = ignore # ignore/add/remove/force # Add or remove space between the pointer star '*' and the name of the variable # in a function pointer definition. sp_ptr_star_func_var = ignore # ignore/add/remove/force # Add or remove space between the pointer star '*' and the name of the type # in a function pointer type definition. 
sp_ptr_star_func_type = ignore # ignore/add/remove/force # Add or remove space after a pointer star '*', if followed by an open # parenthesis, as in 'void* (*)()'. sp_ptr_star_paren = ignore # ignore/add/remove/force # Add or remove space before a pointer star '*', if followed by a function # prototype or function definition. If set to ignore, sp_before_ptr_star is # used instead. sp_before_ptr_star_func = ignore # ignore/add/remove/force # Add or remove space between a qualifier and a pointer star '*' followed by # the name of the function in a function prototype or definition, as in # 'char const *foo()`. If set to ignore, sp_before_ptr_star is used instead. sp_qualifier_ptr_star_func = ignore # ignore/add/remove/force # Add or remove space before a pointer star '*' in the trailing return of a # function prototype or function definition. sp_before_ptr_star_trailing = ignore # ignore/add/remove/force # Add or remove space between a qualifier and a pointer star '*' in the # trailing return of a function prototype or function definition, as in # 'auto foo() -> char const *'. sp_qualifier_ptr_star_trailing = ignore # ignore/add/remove/force # Add or remove space before a reference sign '&'. sp_before_byref = ignore # ignore/add/remove/force # Add or remove space before a reference sign '&' that isn't followed by a # variable name. If set to ignore, sp_before_byref is used instead. sp_before_unnamed_byref = ignore # ignore/add/remove/force # Add or remove space after reference sign '&', if followed by a word. # # Overrides sp_type_func. sp_after_byref = ignore # ignore/add/remove/force # Add or remove space after a reference sign '&', if followed by a function # prototype or function definition. # # Overrides sp_after_byref and sp_type_func. sp_after_byref_func = ignore # ignore/add/remove/force # Add or remove space before a reference sign '&', if followed by a function # prototype or function definition. 
sp_before_byref_func = ignore # ignore/add/remove/force # Add or remove space after a reference sign '&', if followed by an open # parenthesis, as in 'char& (*)()'. sp_byref_paren = ignore # ignore/add/remove/force # Add or remove space between type and word. In cases where total removal of # whitespace would be a syntax error, a value of 'remove' is treated the same # as 'force'. # # This also affects some other instances of space following a type that are # not covered by other options; for example, between the return type and # parenthesis of a function type template argument, between the type and # parenthesis of an array parameter, or between 'decltype(...)' and the # following word. # # Default: force sp_after_type = force # ignore/add/remove/force # Add or remove space between 'decltype(...)' and word, # brace or function call. sp_after_decltype = ignore # ignore/add/remove/force # (D) Add or remove space before the parenthesis in the D constructs # 'template Foo(' and 'class Foo('. sp_before_template_paren = ignore # ignore/add/remove/force # Add or remove space between 'template' and '<'. # If set to ignore, sp_before_angle is used. sp_template_angle = ignore # ignore/add/remove/force # Add or remove space before '<'. sp_before_angle = ignore # ignore/add/remove/force # Add or remove space inside '<' and '>'. sp_inside_angle = ignore # ignore/add/remove/force # Add or remove space inside '<>'. # if empty. sp_inside_angle_empty = ignore # ignore/add/remove/force # Add or remove space between '>' and ':'. sp_angle_colon = ignore # ignore/add/remove/force # Add or remove space after '>'. sp_after_angle = ignore # ignore/add/remove/force # Add or remove space between '>' and '(' as found in 'new List<byte>(foo);'. sp_angle_paren = ignore # ignore/add/remove/force # Add or remove space between '>' and '()' as found in 'new List<byte>();'.
sp_angle_paren_empty = ignore # ignore/add/remove/force # Add or remove space between '>' and a word as in 'List<byte> m;' or # 'template <typename T> static ...'. sp_angle_word = ignore # ignore/add/remove/force # Add or remove space between '>' and '>' in '>>' (template stuff). # # Default: add sp_angle_shift = add # ignore/add/remove/force # (C++11) Permit removal of the space between '>>' in 'foo<bar<int> >'. Note # that sp_angle_shift cannot remove the space without this option. sp_permit_cpp11_shift = false # true/false # Add or remove space before '(' of control statements ('if', 'for', 'switch', # 'while', etc.). sp_before_sparen = ignore # ignore/add/remove/force # Add or remove space inside '(' and ')' of control statements other than # 'for'. sp_inside_sparen = ignore # ignore/add/remove/force # Add or remove space after '(' of control statements other than 'for'. # # Overrides sp_inside_sparen. sp_inside_sparen_open = ignore # ignore/add/remove/force # Add or remove space before ')' of control statements other than 'for'. # # Overrides sp_inside_sparen. sp_inside_sparen_close = ignore # ignore/add/remove/force # Add or remove space inside '(' and ')' of 'for' statements. sp_inside_for = ignore # ignore/add/remove/force # Add or remove space after '(' of 'for' statements. # # Overrides sp_inside_for. sp_inside_for_open = ignore # ignore/add/remove/force # Add or remove space before ')' of 'for' statements. # # Overrides sp_inside_for. sp_inside_for_close = ignore # ignore/add/remove/force # Add or remove space between '((' or '))' of control statements. sp_sparen_paren = ignore # ignore/add/remove/force # Add or remove space after ')' of control statements. sp_after_sparen = ignore # ignore/add/remove/force # Add or remove space between ')' and '{' of control statements. sp_sparen_brace = ignore # ignore/add/remove/force # Add or remove space between 'do' and '{'. sp_do_brace_open = ignore # ignore/add/remove/force # Add or remove space between '}' and 'while'.
sp_brace_close_while = ignore # ignore/add/remove/force # Add or remove space between 'while' and '('. Overrides sp_before_sparen. sp_while_paren_open = ignore # ignore/add/remove/force # (D) Add or remove space between 'invariant' and '('. sp_invariant_paren = ignore # ignore/add/remove/force # (D) Add or remove space after the ')' in 'invariant (C) c'. sp_after_invariant_paren = ignore # ignore/add/remove/force # Add or remove space before empty statement ';' on 'if', 'for' and 'while'. # examples: # if (b) ; # for (a=1; a<10; a++) ; # while (*p++ = ' ') ; sp_special_semi = ignore # ignore/add/remove/force # Add or remove space before ';'. # # Default: remove sp_before_semi = remove # ignore/add/remove/force # Add or remove space before ';' in non-empty 'for' statements. sp_before_semi_for = ignore # ignore/add/remove/force # Add or remove space before a semicolon of an empty left part of a for # statement, as in 'for ( ; ; )'. sp_before_semi_for_empty = ignore # ignore/add/remove/force # Add or remove space between the semicolons of an empty middle part of a for # statement, as in 'for ( ; ; )'. sp_between_semi_for_empty = ignore # ignore/add/remove/force # Add or remove space after ';', except when followed by a comment. # # Default: add sp_after_semi = add # ignore/add/remove/force # Add or remove space after ';' in non-empty 'for' statements. # # Default: force sp_after_semi_for = force # ignore/add/remove/force # Add or remove space after the final semicolon of an empty part of a for # statement, as in 'for ( ; ; )'. sp_after_semi_for_empty = ignore # ignore/add/remove/force # Add or remove space before '[' (except '[]'). sp_before_square = ignore # ignore/add/remove/force # Add or remove space before '[' for a variable definition. # # Default: remove sp_before_vardef_square = remove # ignore/add/remove/force # Add or remove space before '[' for asm block. sp_before_square_asm_block = ignore # ignore/add/remove/force # Add or remove space before '[]'. 
sp_before_squares = ignore # ignore/add/remove/force # Add or remove space before C++17 structured bindings # after byref. sp_cpp_before_struct_binding_after_byref = ignore # ignore/add/remove/force # Add or remove space before C++17 structured bindings. sp_cpp_before_struct_binding = ignore # ignore/add/remove/force # Add or remove space inside a non-empty '[' and ']'. sp_inside_square = ignore # ignore/add/remove/force # Add or remove space inside '[]'. # if empty. sp_inside_square_empty = ignore # ignore/add/remove/force # (OC) Add or remove space inside a non-empty Objective-C boxed array '@[' and # ']'. If set to ignore, sp_inside_square is used. sp_inside_square_oc_array = ignore # ignore/add/remove/force # Add or remove space after ',', i.e. 'a,b' vs. 'a, b'. sp_after_comma = ignore # ignore/add/remove/force # Add or remove space before ',', i.e. 'a,b' vs. 'a ,b'. # # Default: remove sp_before_comma = remove # ignore/add/remove/force # (C#, Vala) Add or remove space between ',' and ']' in multidimensional array type # like 'int[,,]'. sp_after_mdatype_commas = ignore # ignore/add/remove/force # (C#, Vala) Add or remove space between '[' and ',' in multidimensional array type # like 'int[,,]'. sp_before_mdatype_commas = ignore # ignore/add/remove/force # (C#, Vala) Add or remove space between ',' in multidimensional array type # like 'int[,,]'. sp_between_mdatype_commas = ignore # ignore/add/remove/force # Add or remove space between an open parenthesis and comma, # i.e. '(,' vs. '( ,'. # # Default: force sp_paren_comma = force # ignore/add/remove/force # Add or remove space between a type and ':'. sp_type_colon = ignore # ignore/add/remove/force # Add or remove space after the variadic '...' when preceded by a # non-punctuator. # The value REMOVE will be overridden with FORCE sp_after_ellipsis = ignore # ignore/add/remove/force # Add or remove space before the variadic '...' when preceded by a # non-punctuator. 
# The value REMOVE will be overridden with FORCE sp_before_ellipsis = ignore # ignore/add/remove/force # Add or remove space between a type and '...'. sp_type_ellipsis = ignore # ignore/add/remove/force # Add or remove space between a '*' and '...'. sp_ptr_type_ellipsis = ignore # ignore/add/remove/force # Add or remove space between ')' and '...'. sp_paren_ellipsis = ignore # ignore/add/remove/force # Add or remove space between '&&' and '...'. sp_byref_ellipsis = ignore # ignore/add/remove/force # Add or remove space between ')' and a qualifier such as 'const'. sp_paren_qualifier = ignore # ignore/add/remove/force # Add or remove space between ')' and 'noexcept'. sp_paren_noexcept = ignore # ignore/add/remove/force # Add or remove space after class ':'. sp_after_class_colon = ignore # ignore/add/remove/force # Add or remove space before class ':'. sp_before_class_colon = ignore # ignore/add/remove/force # Add or remove space after class constructor ':'. # # Default: add sp_after_constr_colon = add # ignore/add/remove/force # Add or remove space before class constructor ':'. # # Default: add sp_before_constr_colon = add # ignore/add/remove/force # Add or remove space before case ':'. # # Default: remove sp_before_case_colon = remove # ignore/add/remove/force # Add or remove space between 'operator' and operator sign. sp_after_operator = ignore # ignore/add/remove/force # Add or remove space between the operator symbol and the open parenthesis, as # in 'operator ++('. sp_after_operator_sym = ignore # ignore/add/remove/force # Overrides sp_after_operator_sym when the operator has no arguments, as in # 'operator *()'. sp_after_operator_sym_empty = ignore # ignore/add/remove/force # Add or remove space after C/D cast, i.e. 'cast(int)a' vs. 'cast(int) a' or # '(int)a' vs. '(int) a'. sp_after_cast = ignore # ignore/add/remove/force # Add or remove spaces inside cast parentheses. 
sp_inside_paren_cast = ignore # ignore/add/remove/force # Add or remove space between the type and open parenthesis in a C++ cast, # i.e. 'int(exp)' vs. 'int (exp)'. sp_cpp_cast_paren = ignore # ignore/add/remove/force # Add or remove space between 'sizeof' and '('. sp_sizeof_paren = ignore # ignore/add/remove/force # Add or remove space between 'sizeof' and '...'. sp_sizeof_ellipsis = ignore # ignore/add/remove/force # Add or remove space between 'sizeof...' and '('. sp_sizeof_ellipsis_paren = ignore # ignore/add/remove/force # Add or remove space between '...' and a parameter pack. sp_ellipsis_parameter_pack = ignore # ignore/add/remove/force # Add or remove space between a parameter pack and '...'. sp_parameter_pack_ellipsis = ignore # ignore/add/remove/force # Add or remove space between 'decltype' and '('. sp_decltype_paren = ignore # ignore/add/remove/force # (Pawn) Add or remove space after the tag keyword. sp_after_tag = ignore # ignore/add/remove/force # Add or remove space inside enum '{' and '}'. sp_inside_braces_enum = ignore # ignore/add/remove/force # Add or remove space inside struct/union '{' and '}'. sp_inside_braces_struct = ignore # ignore/add/remove/force # (OC) Add or remove space inside Objective-C boxed dictionary '{' and '}' sp_inside_braces_oc_dict = ignore # ignore/add/remove/force # Add or remove space after open brace in an unnamed temporary # direct-list-initialization # if statement is a brace_init_lst # works only if sp_brace_brace is set to ignore. sp_after_type_brace_init_lst_open = ignore # ignore/add/remove/force # Add or remove space before close brace in an unnamed temporary # direct-list-initialization # if statement is a brace_init_lst # works only if sp_brace_brace is set to ignore. 
sp_before_type_brace_init_lst_close = ignore # ignore/add/remove/force # Add or remove space inside an unnamed temporary direct-list-initialization # if statement is a brace_init_lst # works only if sp_brace_brace is set to ignore # works only if sp_before_type_brace_init_lst_close is set to ignore. sp_inside_type_brace_init_lst = ignore # ignore/add/remove/force # Add or remove space inside '{' and '}'. sp_inside_braces = ignore # ignore/add/remove/force # Add or remove space inside '{}'. # if empty. sp_inside_braces_empty = ignore # ignore/add/remove/force # Add or remove space around trailing return operator '->'. sp_trailing_return = ignore # ignore/add/remove/force # Add or remove space between return type and function name. A minimum of 1 # is forced except for pointer return types. sp_type_func = ignore # ignore/add/remove/force # Add or remove space between type and open brace of an unnamed temporary # direct-list-initialization. sp_type_brace_init_lst = ignore # ignore/add/remove/force # Add or remove space between function name and '(' on function declaration. sp_func_proto_paren = ignore # ignore/add/remove/force # Add or remove space between function name and '()' on function declaration # if empty. sp_func_proto_paren_empty = ignore # ignore/add/remove/force # Add or remove space between function name and '(' with a typedef specifier. sp_func_type_paren = ignore # ignore/add/remove/force # Add or remove space between alias name and '(' of a non-pointer function type typedef. sp_func_def_paren = ignore # ignore/add/remove/force # Add or remove space between function name and '()' on function definition # if empty. sp_func_def_paren_empty = ignore # ignore/add/remove/force # Add or remove space inside empty function '()'. # Overrides sp_after_angle unless use_sp_after_angle_always is set to true. sp_inside_fparens = ignore # ignore/add/remove/force # Add or remove space inside function '(' and ')'. 
sp_inside_fparen = ignore # ignore/add/remove/force # Add or remove space inside user functor '(' and ')'. sp_func_call_user_inside_rparen = ignore # ignore/add/remove/force # Add or remove space inside empty functor '()'. # Overrides sp_after_angle unless use_sp_after_angle_always is set to true. sp_inside_rparens = ignore # ignore/add/remove/force # Add or remove space inside functor '(' and ')'. sp_inside_rparen = ignore # ignore/add/remove/force # Add or remove space inside the first parentheses in a function type, as in # 'void (*x)(...)'. sp_inside_tparen = ignore # ignore/add/remove/force # Add or remove space between the ')' and '(' in a function type, as in # 'void (*x)(...)'. sp_after_tparen_close = ignore # ignore/add/remove/force # Add or remove space between ']' and '(' when part of a function call. sp_square_fparen = ignore # ignore/add/remove/force # Add or remove space between ')' and '{' of function. sp_fparen_brace = ignore # ignore/add/remove/force # Add or remove space between ')' and '{' of a function call in object # initialization. # # Overrides sp_fparen_brace. sp_fparen_brace_initializer = ignore # ignore/add/remove/force # (Java) Add or remove space between ')' and '{{' of double brace initializer. sp_fparen_dbrace = ignore # ignore/add/remove/force # Add or remove space between function name and '(' on function calls. sp_func_call_paren = ignore # ignore/add/remove/force # Add or remove space between function name and '()' on function calls without # parameters. If set to ignore (the default), sp_func_call_paren is used. sp_func_call_paren_empty = ignore # ignore/add/remove/force # Add or remove space between the user function name and '(' on function # calls. You need to set a keyword to be a user function in the config file, # like: # set func_call_user tr _ i18n sp_func_call_user_paren = ignore # ignore/add/remove/force # Add or remove space inside user function '(' and ')'. 
sp_func_call_user_inside_fparen = ignore # ignore/add/remove/force # Add or remove space between nested parentheses with user functions, # i.e. '((' vs. '( ('. sp_func_call_user_paren_paren = ignore # ignore/add/remove/force # Add or remove space between a constructor/destructor and the open # parenthesis. sp_func_class_paren = ignore # ignore/add/remove/force # Add or remove space between a constructor without parameters or destructor # and '()'. sp_func_class_paren_empty = ignore # ignore/add/remove/force # Add or remove space after 'return'. # # Default: force sp_return = force # ignore/add/remove/force # Add or remove space between 'return' and '('. sp_return_paren = ignore # ignore/add/remove/force # Add or remove space between 'return' and '{'. sp_return_brace = ignore # ignore/add/remove/force # Add or remove space between '__attribute__' and '('. sp_attribute_paren = ignore # ignore/add/remove/force # Add or remove space between 'defined' and '(' in '#if defined (FOO)'. sp_defined_paren = ignore # ignore/add/remove/force # Add or remove space between 'throw' and '(' in 'throw (something)'. sp_throw_paren = ignore # ignore/add/remove/force # Add or remove space between 'throw' and anything other than '(' as in # '@throw [...];'. sp_after_throw = ignore # ignore/add/remove/force # Add or remove space between 'catch' and '(' in 'catch (something) { }'. # If set to ignore, sp_before_sparen is used. sp_catch_paren = ignore # ignore/add/remove/force # (OC) Add or remove space between '@catch' and '(' # in '@catch (something) { }'. If set to ignore, sp_catch_paren is used. sp_oc_catch_paren = ignore # ignore/add/remove/force # (OC) Add or remove space before Objective-C protocol list # as in '@protocol Protocol' or '@interface MyClass : NSObject'. 
sp_before_oc_proto_list = ignore # ignore/add/remove/force # (OC) Add or remove space between class name and '(' # in '@interface className(categoryName):BaseClass' sp_oc_classname_paren = ignore # ignore/add/remove/force # (D) Add or remove space between 'version' and '(' # in 'version (something) { }'. If set to ignore, sp_before_sparen is used. sp_version_paren = ignore # ignore/add/remove/force # (D) Add or remove space between 'scope' and '(' # in 'scope (something) { }'. If set to ignore, sp_before_sparen is used. sp_scope_paren = ignore # ignore/add/remove/force # Add or remove space between 'super' and '(' in 'super (something)'. # # Default: remove sp_super_paren = remove # ignore/add/remove/force # Add or remove space between 'this' and '(' in 'this (something)'. # # Default: remove sp_this_paren = remove # ignore/add/remove/force # Add or remove space between a macro name and its definition. sp_macro = ignore # ignore/add/remove/force # Add or remove space between a macro function ')' and its definition. sp_macro_func = ignore # ignore/add/remove/force # Add or remove space between 'else' and '{' if on the same line. sp_else_brace = ignore # ignore/add/remove/force # Add or remove space between '}' and 'else' if on the same line. sp_brace_else = ignore # ignore/add/remove/force # Add or remove space between '}' and the name of a typedef on the same line. sp_brace_typedef = ignore # ignore/add/remove/force # Add or remove space before the '{' of a 'catch' statement, if the '{' and # 'catch' are on the same line, as in 'catch (decl) {'. sp_catch_brace = ignore # ignore/add/remove/force # (OC) Add or remove space before the '{' of a '@catch' statement, if the '{' # and '@catch' are on the same line, as in '@catch (decl) {'. # If set to ignore, sp_catch_brace is used. sp_oc_catch_brace = ignore # ignore/add/remove/force # Add or remove space between '}' and 'catch' if on the same line. 
sp_brace_catch = ignore # ignore/add/remove/force # (OC) Add or remove space between '}' and '@catch' if on the same line. # If set to ignore, sp_brace_catch is used. sp_oc_brace_catch = ignore # ignore/add/remove/force # Add or remove space between 'finally' and '{' if on the same line. sp_finally_brace = ignore # ignore/add/remove/force # Add or remove space between '}' and 'finally' if on the same line. sp_brace_finally = ignore # ignore/add/remove/force # Add or remove space between 'try' and '{' if on the same line. sp_try_brace = ignore # ignore/add/remove/force # Add or remove space between get/set and '{' if on the same line. sp_getset_brace = ignore # ignore/add/remove/force # Add or remove space between a variable and '{' for C++ uniform # initialization. sp_word_brace_init_lst = ignore # ignore/add/remove/force # Add or remove space between a variable and '{' for a namespace. # # Default: add sp_word_brace_ns = add # ignore/add/remove/force # Add or remove space before the '::' operator. sp_before_dc = ignore # ignore/add/remove/force # Add or remove space after the '::' operator. sp_after_dc = ignore # ignore/add/remove/force # (D) Add or remove around the D named array initializer ':' operator. sp_d_array_colon = ignore # ignore/add/remove/force # Add or remove space after the '!' (not) unary operator. # # Default: remove sp_not = remove # ignore/add/remove/force # Add or remove space between two '!' (not) unary operators. # If set to ignore, sp_not will be used. sp_not_not = ignore # ignore/add/remove/force # Add or remove space after the '~' (invert) unary operator. # # Default: remove sp_inv = remove # ignore/add/remove/force # Add or remove space after the '&' (address-of) unary operator. This does not # affect the spacing after a '&' that is part of a type. # # Default: remove sp_addr = remove # ignore/add/remove/force # Add or remove space around the '.' or '->' operators. 
# # Default: remove sp_member = remove # ignore/add/remove/force # Add or remove space after the '*' (dereference) unary operator. This does # not affect the spacing after a '*' that is part of a type. # # Default: remove sp_deref = remove # ignore/add/remove/force # Add or remove space after '+' or '-', as in 'x = -5' or 'y = +7'. # # Default: remove sp_sign = remove # ignore/add/remove/force # Add or remove space between '++' and '--' the word to which it is being # applied, as in '(--x)' or 'y++;'. # # Default: remove sp_incdec = remove # ignore/add/remove/force # Add or remove space before a backslash-newline at the end of a line. # # Default: add sp_before_nl_cont = add # ignore/add/remove/force # (OC) Add or remove space after the scope '+' or '-', as in '-(void) foo;' # or '+(int) bar;'. sp_after_oc_scope = ignore # ignore/add/remove/force # (OC) Add or remove space after the colon in message specs, # i.e. '-(int) f:(int) x;' vs. '-(int) f: (int) x;'. sp_after_oc_colon = ignore # ignore/add/remove/force # (OC) Add or remove space before the colon in message specs, # i.e. '-(int) f: (int) x;' vs. '-(int) f : (int) x;'. sp_before_oc_colon = ignore # ignore/add/remove/force # (OC) Add or remove space after the colon in immutable dictionary expression # 'NSDictionary *test = @{@"foo" :@"bar"};'. sp_after_oc_dict_colon = ignore # ignore/add/remove/force # (OC) Add or remove space before the colon in immutable dictionary expression # 'NSDictionary *test = @{@"foo" :@"bar"};'. sp_before_oc_dict_colon = ignore # ignore/add/remove/force # (OC) Add or remove space after the colon in message specs, # i.e. '[object setValue:1];' vs. '[object setValue: 1];'. sp_after_send_oc_colon = ignore # ignore/add/remove/force # (OC) Add or remove space before the colon in message specs, # i.e. '[object setValue:1];' vs. '[object setValue :1];'. sp_before_send_oc_colon = ignore # ignore/add/remove/force # (OC) Add or remove space after the (type) in message specs, # i.e. 
'-(int)f: (int) x;' vs. '-(int)f: (int)x;'. sp_after_oc_type = ignore # ignore/add/remove/force # (OC) Add or remove space after the first (type) in message specs, # i.e. '-(int) f:(int)x;' vs. '-(int)f:(int)x;'. sp_after_oc_return_type = ignore # ignore/add/remove/force # (OC) Add or remove space between '@selector' and '(', # i.e. '@selector(msgName)' vs. '@selector (msgName)'. # Also applies to '@protocol()' constructs. sp_after_oc_at_sel = ignore # ignore/add/remove/force # (OC) Add or remove space between '@selector(x)' and the following word, # i.e. '@selector(foo) a:' vs. '@selector(foo)a:'. sp_after_oc_at_sel_parens = ignore # ignore/add/remove/force # (OC) Add or remove space inside '@selector' parentheses, # i.e. '@selector(foo)' vs. '@selector( foo )'. # Also applies to '@protocol()' constructs. sp_inside_oc_at_sel_parens = ignore # ignore/add/remove/force # (OC) Add or remove space before a block pointer caret, # i.e. '^int (int arg){...}' vs. ' ^int (int arg){...}'. sp_before_oc_block_caret = ignore # ignore/add/remove/force # (OC) Add or remove space after a block pointer caret, # i.e. '^int (int arg){...}' vs. '^ int (int arg){...}'. sp_after_oc_block_caret = ignore # ignore/add/remove/force # (OC) Add or remove space between the receiver and selector in a message, # as in '[receiver selector ...]'. sp_after_oc_msg_receiver = ignore # ignore/add/remove/force # (OC) Add or remove space after '@property'. sp_after_oc_property = ignore # ignore/add/remove/force # (OC) Add or remove space between '@synchronized' and the open parenthesis, # i.e. '@synchronized(foo)' vs. '@synchronized (foo)'. sp_after_oc_synchronized = ignore # ignore/add/remove/force # Add or remove space around the ':' in 'b ? t : f'. sp_cond_colon = ignore # ignore/add/remove/force # Add or remove space before the ':' in 'b ? t : f'. # # Overrides sp_cond_colon. sp_cond_colon_before = ignore # ignore/add/remove/force # Add or remove space after the ':' in 'b ? t : f'. 
# # Overrides sp_cond_colon. sp_cond_colon_after = ignore # ignore/add/remove/force # Add or remove space around the '?' in 'b ? t : f'. sp_cond_question = ignore # ignore/add/remove/force # Add or remove space before the '?' in 'b ? t : f'. # # Overrides sp_cond_question. sp_cond_question_before = ignore # ignore/add/remove/force # Add or remove space after the '?' in 'b ? t : f'. # # Overrides sp_cond_question. sp_cond_question_after = ignore # ignore/add/remove/force # In the abbreviated ternary form '(a ?: b)', add or remove space between '?' # and ':'. # # Overrides all other sp_cond_* options. sp_cond_ternary_short = ignore # ignore/add/remove/force # Fix the spacing between 'case' and the label. Only 'ignore' and 'force' make # sense here. sp_case_label = ignore # ignore/add/remove/force # (D) Add or remove space around the D '..' operator. sp_range = ignore # ignore/add/remove/force # Add or remove space after ':' in a Java/C++11 range-based 'for', # as in 'for (Type var : expr)'. sp_after_for_colon = ignore # ignore/add/remove/force # Add or remove space before ':' in a Java/C++11 range-based 'for', # as in 'for (Type var : expr)'. sp_before_for_colon = ignore # ignore/add/remove/force # (D) Add or remove space between 'extern' and '(' as in 'extern (C)'. sp_extern_paren = ignore # ignore/add/remove/force # Add or remove space after the opening of a C++ comment, as in '// A'. sp_cmt_cpp_start = ignore # ignore/add/remove/force # remove space after the '//' and the pvs command '-V1234', # only works with sp_cmt_cpp_start set to add or force. sp_cmt_cpp_pvs = false # true/false # remove space after the '//' and the command 'lint', # only works with sp_cmt_cpp_start set to add or force. sp_cmt_cpp_lint = false # true/false # Add or remove space in a C++ region marker comment, as in '// BEGIN'. # A region marker is defined as a comment which is not preceded by other text # (i.e. 
the comment is the first non-whitespace on the line), and which starts # with either 'BEGIN' or 'END'. # # Overrides sp_cmt_cpp_start. sp_cmt_cpp_region = ignore # ignore/add/remove/force # If true, space added with sp_cmt_cpp_start will be added after Doxygen # sequences like '///', '///<', '//!' and '//!<'. sp_cmt_cpp_doxygen = false # true/false # If true, space added with sp_cmt_cpp_start will be added after Qt translator # or meta-data comments like '//:', '//=', and '//~'. sp_cmt_cpp_qttr = false # true/false # Add or remove space between #else or #endif and a trailing comment. sp_endif_cmt = ignore # ignore/add/remove/force # Add or remove space after 'new', 'delete' and 'delete[]'. sp_after_new = ignore # ignore/add/remove/force # Add or remove space between 'new' and '(' in 'new()'. sp_between_new_paren = ignore # ignore/add/remove/force # Add or remove space between ')' and type in 'new(foo) BAR'. sp_after_newop_paren = ignore # ignore/add/remove/force # Add or remove space inside parentheses of the new operator # as in 'new(foo) BAR'. sp_inside_newop_paren = ignore # ignore/add/remove/force # Add or remove space after the open parenthesis of the new operator, # as in 'new(foo) BAR'. # # Overrides sp_inside_newop_paren. sp_inside_newop_paren_open = ignore # ignore/add/remove/force # Add or remove space before the close parenthesis of the new operator, # as in 'new(foo) BAR'. # # Overrides sp_inside_newop_paren. sp_inside_newop_paren_close = ignore # ignore/add/remove/force # Add or remove space before a trailing comment. sp_before_tr_cmt = ignore # ignore/add/remove/force # Number of spaces before a trailing comment. sp_num_before_tr_cmt = 0 # unsigned number # Add or remove space before an embedded comment. # # Default: force sp_before_emb_cmt = force # ignore/add/remove/force # Number of spaces before an embedded comment. # # Default: 1 sp_num_before_emb_cmt = 1 # unsigned number # Add or remove space after an embedded comment. 
# # Default: force sp_after_emb_cmt = force # ignore/add/remove/force # Number of spaces after an embedded comment. # # Default: 1 sp_num_after_emb_cmt = 1 # unsigned number # Embedded comment spacing options have higher priority (== override) # than other spacing options (comma, parenthesis, braces, ...) sp_emb_cmt_priority = false # true/false # (Java) Add or remove space between an annotation and the open parenthesis. sp_annotation_paren = ignore # ignore/add/remove/force # If true, vbrace tokens are dropped to the previous token and skipped. sp_skip_vbrace_tokens = false # true/false # Add or remove space after 'noexcept'. sp_after_noexcept = ignore # ignore/add/remove/force # Add or remove space after '_'. sp_vala_after_translation = ignore # ignore/add/remove/force # Add or remove space before a bit colon ':'. sp_before_bit_colon = ignore # ignore/add/remove/force # Add or remove space after a bit colon ':'. sp_after_bit_colon = ignore # ignore/add/remove/force # If true, a tab is inserted after #define. force_tab_after_define = false # true/false # Add or remove space between two strings. sp_string_string = ignore # ignore/add/remove/force # Add or remove space between 'struct' and a type. sp_struct_type = ignore # ignore/add/remove/force # # Indenting options # # The number of columns to indent per level. Usually 2, 3, 4, or 8. # # Default: 8 indent_columns = 8 # unsigned number # Whether to ignore indent for the first continuation line. Subsequent # continuation lines will still be indented to match the first. indent_ignore_first_continue = false # true/false # The continuation indent. If non-zero, this overrides the indent of '(', '[' # and '=' continuation indents. Negative values are OK; negative value is # absolute and not increased for each '(' or '[' level. # # For FreeBSD, this is set to 4. # Requires indent_ignore_first_continue=false. indent_continue = 0 # number # The continuation indent, only for class header line(s). 
If non-zero, this # overrides the indent of 'class' continuation indents. # Requires indent_ignore_first_continue=false. indent_continue_class_head = 0 # unsigned number # Whether to indent empty lines (i.e. lines which contain only spaces before # the newline character). indent_single_newlines = false # true/false # The continuation indent for func_*_param if they are true. If non-zero, this # overrides the indent. indent_param = 0 # unsigned number # How to use tabs when indenting code. # # 0: Spaces only # 1: Indent with tabs to brace level, align with spaces (default) # 2: Indent and align with tabs, using spaces when not on a tabstop # # Default: 1 indent_with_tabs = 1 # unsigned number # Whether to indent comments that are not at a brace level with tabs on a # tabstop. Requires indent_with_tabs=2. If false, will use spaces. indent_cmt_with_tabs = false # true/false # Whether to indent strings broken by '\' so that they line up. indent_align_string = false # true/false # The number of spaces to indent multi-line XML strings. # Requires indent_align_string=true. indent_xml_string = 0 # unsigned number # Spaces to indent '{' from level. indent_brace = 0 # unsigned number # Whether braces are indented to the body level. indent_braces = false # true/false # Whether to disable indenting function braces if indent_braces=true. indent_braces_no_func = false # true/false # Whether to disable indenting class braces if indent_braces=true. indent_braces_no_class = false # true/false # Whether to disable indenting struct braces if indent_braces=true. indent_braces_no_struct = false # true/false # Whether to indent based on the size of the brace parent, # i.e. 'if' => 3 spaces, 'for' => 4 spaces, etc. indent_brace_parent = false # true/false # Whether to indent based on the open parenthesis instead of the open brace # in '({\n'. indent_paren_open_brace = false # true/false # (C#) Whether to indent the brace of a C# delegate by another level. 
indent_cs_delegate_brace = false # true/false # (C#) Whether to indent a C# delegate (to handle delegates with no brace) by # another level. indent_cs_delegate_body = false # true/false # Whether to indent the body of a 'namespace'. indent_namespace = false # true/false # Whether to indent only the first namespace, and not any nested namespaces. # Requires indent_namespace=true. indent_namespace_single_indent = false # true/false # The number of spaces to indent a namespace block. # If set to zero, use the value indent_columns indent_namespace_level = 0 # unsigned number # If the body of the namespace is longer than this number, it won't be # indented. Requires indent_namespace=true. 0 means no limit. indent_namespace_limit = 0 # unsigned number # Whether to indent only in inner namespaces (nested in other namespaces). # Requires indent_namespace=true. indent_namespace_inner_only = false # true/false # Whether the 'extern "C"' body is indented. indent_extern = false # true/false # Whether the 'class' body is indented. indent_class = false # true/false # Whether to ignore indent for the leading base class colon. indent_ignore_before_class_colon = false # true/false # Additional indent before the leading base class colon. # Negative values decrease indent down to the first column. # Requires indent_ignore_before_class_colon=false and a newline break before # the colon (see pos_class_colon and nl_class_colon) indent_before_class_colon = 0 # number # Whether to indent the stuff after a leading base class colon. indent_class_colon = false # true/false # Whether to indent based on a class colon instead of the stuff after the # colon. Requires indent_class_colon=true. indent_class_on_colon = false # true/false # Whether to ignore indent for a leading class initializer colon. indent_ignore_before_constr_colon = false # true/false # Whether to indent the stuff after a leading class initializer colon. 
indent_constr_colon = false # true/false # Virtual indent from the ':' for leading member initializers. # # Default: 2 indent_ctor_init_leading = 2 # unsigned number # Virtual indent from the ':' for following member initializers. # # Default: 2 indent_ctor_init_following = 2 # unsigned number # Additional indent for constructor initializer list. # Negative values decrease indent down to the first column. indent_ctor_init = 0 # number # Whether to indent 'if' following 'else' as a new block under the 'else'. # If false, 'else\nif' is treated as 'else if' for indenting purposes. indent_else_if = false # true/false # Amount to indent variable declarations after an open brace. # # <0: Relative # >=0: Absolute indent_var_def_blk = 0 # number # Whether to indent continued variable declarations instead of aligning. indent_var_def_cont = false # true/false # How to indent continued shift expressions ('<<' and '>>'). # Set align_left_shift=false when using this. # 0: Align shift operators instead of indenting them (default) # 1: Indent by one level # -1: Preserve original indentation indent_shift = 0 # number # Whether to force indentation of function definitions to start in column 1. indent_func_def_force_col1 = false # true/false # Whether to indent continued function call parameters one indent level, # rather than aligning parameters under the open parenthesis. indent_func_call_param = false # true/false # Whether to indent continued function definition parameters one indent level, # rather than aligning parameters under the open parenthesis. 
indent_func_def_param = false # true/false # for function definitions, only if indent_func_def_param is false # Allows to align params when appropriate and indent them when not # behave as if it was true if paren position is more than this value # if paren position is more than the option value indent_func_def_param_paren_pos_threshold = 0 # unsigned number # Whether to indent continued function call prototype one indent level, # rather than aligning parameters under the open parenthesis. indent_func_proto_param = false # true/false # Whether to indent continued function call declaration one indent level, # rather than aligning parameters under the open parenthesis. indent_func_class_param = false # true/false # Whether to indent continued class variable constructors one indent level, # rather than aligning parameters under the open parenthesis. indent_func_ctor_var_param = false # true/false # Whether to indent continued template parameter list one indent level, # rather than aligning parameters under the open parenthesis. indent_template_param = false # true/false # Double the indent for indent_func_xxx_param options. # Use both values of the options indent_columns and indent_param. indent_func_param_double = false # true/false # Indentation column for standalone 'const' qualifier on a function # prototype. indent_func_const = 0 # unsigned number # Indentation column for standalone 'throw' qualifier on a function # prototype. indent_func_throw = 0 # unsigned number # How to indent within a macro followed by a brace on the same line # This allows reducing the indent in macros that have (for example) # `do { ... } while (0)` blocks bracketing them. # # true: add an indent for the brace on the same line as the macro # false: do not add an indent for the brace on the same line as the macro # # Default: true indent_macro_brace = true # true/false # The number of spaces to indent a continued '->' or '.'. # Usually set to 0, 1, or indent_columns. 
indent_member = 0 # unsigned number # Whether lines broken at '.' or '->' should be indented by a single indent. # The indent_member option will not be effective if this is set to true. indent_member_single = false # true/false # Spaces to indent single line ('//') comments on lines before code. indent_single_line_comments_before = 0 # unsigned number # Spaces to indent single line ('//') comments on lines after code. indent_single_line_comments_after = 0 # unsigned number # When opening a paren for a control statement (if, for, while, etc), increase # the indent level by this value. Negative values decrease the indent level. indent_sparen_extra = 0 # number # Whether to indent trailing single line ('//') comments relative to the code # instead of trying to keep the same absolute column. indent_relative_single_line_comments = false # true/false # Spaces to indent 'case' from 'switch'. Usually 0 or indent_columns. # It might be wise to choose the same value for the option indent_case_brace. indent_switch_case = 0 # unsigned number # Spaces to indent the body of a 'switch' before any 'case'. # Usually the same as indent_columns or indent_switch_case. indent_switch_body = 0 # unsigned number # Whether to ignore indent for '{' following 'case'. indent_ignore_case_brace = false # true/false # Spaces to indent '{' from 'case'. By default, the brace will appear under # the 'c' in case. Usually set to 0 or indent_columns. Negative values are OK. # It might be wise to choose the same value for the option indent_switch_case. indent_case_brace = 0 # number # indent 'break' with 'case' from 'switch'. indent_switch_break_with_case = false # true/false # Whether to indent preprocessor statements inside of switch statements. # # Default: true indent_switch_pp = true # true/false # Spaces to shift the 'case' line, without affecting any other lines. # Usually 0. indent_case_shift = 0 # unsigned number # Whether to align comments before 'case' with the 'case'. 
# # Default: true indent_case_comment = true # true/false # Whether to indent comments not found in first column. # # Default: true indent_comment = true # true/false # Whether to indent comments found in first column. indent_col1_comment = false # true/false # Whether to indent multi string literal in first column. indent_col1_multi_string_literal = false # true/false # Align comments on adjacent lines that are this many columns apart or less. # # Default: 3 indent_comment_align_thresh = 3 # unsigned number # Whether to ignore indent for goto labels. indent_ignore_label = false # true/false # How to indent goto labels. Requires indent_ignore_label=false. # # >0: Absolute column where 1 is the leftmost column # <=0: Subtract from brace indent # # Default: 1 indent_label = 1 # number # How to indent access specifiers that are followed by a # colon. # # >0: Absolute column where 1 is the leftmost column # <=0: Subtract from brace indent # # Default: 1 indent_access_spec = 1 # number # Whether to indent the code after an access specifier by one level. # If true, this option forces 'indent_access_spec=0'. indent_access_spec_body = false # true/false # If an open parenthesis is followed by a newline, whether to indent the next # line so that it lines up after the open parenthesis (not recommended). indent_paren_nl = false # true/false # How to indent a close parenthesis after a newline. # # 0: Indent to body level (default) # 1: Align under the open parenthesis # 2: Indent to the brace level # -1: Preserve original indentation indent_paren_close = 0 # number # Whether to indent the open parenthesis of a function definition, # if the parenthesis is on its own line. indent_paren_after_func_def = false # true/false # Whether to indent the open parenthesis of a function declaration, # if the parenthesis is on its own line. indent_paren_after_func_decl = false # true/false # Whether to indent the open parenthesis of a function call, # if the parenthesis is on its own line. 
indent_paren_after_func_call = false # true/false # How to indent a comma when inside braces. # 0: Indent by one level (default) # 1: Align under the open brace # -1: Preserve original indentation indent_comma_brace = 0 # number # How to indent a comma when inside parentheses. # 0: Indent by one level (default) # 1: Align under the open parenthesis # -1: Preserve original indentation indent_comma_paren = 0 # number # How to indent a Boolean operator when inside parentheses. # 0: Indent by one level (default) # 1: Align under the open parenthesis # -1: Preserve original indentation indent_bool_paren = 0 # number # Whether to ignore the indentation of a Boolean operator when outside # parentheses. indent_ignore_bool = false # true/false # Whether to ignore the indentation of an arithmetic operator. indent_ignore_arith = false # true/false # Whether to indent a semicolon when inside a for parenthesis. # If true, aligns under the open for parenthesis. indent_semicolon_for_paren = false # true/false # Whether to ignore the indentation of a semicolon outside of a 'for' # statement. indent_ignore_semicolon = false # true/false # Whether to align the first expression to following ones # if indent_bool_paren=1. indent_first_bool_expr = false # true/false # Whether to align the first expression to following ones # if indent_semicolon_for_paren=true. indent_first_for_expr = false # true/false # If an open square is followed by a newline, whether to indent the next line # so that it lines up after the open square (not recommended). indent_square_nl = false # true/false # (ESQL/C) Whether to preserve the relative indent of 'EXEC SQL' bodies. indent_preserve_sql = false # true/false # Whether to ignore the indentation of an assignment operator. indent_ignore_assign = false # true/false # Whether to align continued statements at the '='. If false or if the '=' is # followed by a newline, the next line is indent one tab. 
# # Default: true indent_align_assign = true # true/false # If true, the indentation of the chunks after a '=' sequence will be set at # LHS token indentation column before '='. indent_off_after_assign = false # true/false # Whether to align continued statements at the '('. If false or the '(' is # followed by a newline, the next line indent is one tab. # # Default: true indent_align_paren = true # true/false # (OC) Whether to indent Objective-C code inside message selectors. indent_oc_inside_msg_sel = false # true/false # (OC) Whether to indent Objective-C blocks at brace level instead of usual # rules. indent_oc_block = false # true/false # (OC) Indent for Objective-C blocks in a message relative to the parameter # name. # # =0: Use indent_oc_block rules # >0: Use specified number of spaces to indent indent_oc_block_msg = 0 # unsigned number # (OC) Minimum indent for subsequent parameters indent_oc_msg_colon = 0 # unsigned number # (OC) Whether to prioritize aligning with initial colon (and stripping spaces # from lines, if necessary). # # Default: true indent_oc_msg_prioritize_first_colon = true # true/false # (OC) Whether to indent blocks the way that Xcode does by default # (from the keyword if the parameter is on its own line; otherwise, from the # previous indentation level). Requires indent_oc_block_msg=true. indent_oc_block_msg_xcode_style = false # true/false # (OC) Whether to indent blocks from where the brace is, relative to a # message keyword. Requires indent_oc_block_msg=true. indent_oc_block_msg_from_keyword = false # true/false # (OC) Whether to indent blocks from where the brace is, relative to a message # colon. Requires indent_oc_block_msg=true. indent_oc_block_msg_from_colon = false # true/false # (OC) Whether to indent blocks from where the block caret is. # Requires indent_oc_block_msg=true. indent_oc_block_msg_from_caret = false # true/false # (OC) Whether to indent blocks from where the brace caret is. # Requires indent_oc_block_msg=true. 
indent_oc_block_msg_from_brace = false # true/false # When indenting after virtual brace open and newline add further spaces to # reach this minimum indent. indent_min_vbrace_open = 0 # unsigned number # Whether to add further spaces after regular indent to reach next tabstop # when indenting after virtual brace open and newline. indent_vbrace_open_on_tabstop = false # true/false # How to indent after a brace followed by another token (not a newline). # true: indent all contained lines to match the token # false: indent all contained lines to match the brace # # Default: true indent_token_after_brace = true # true/false # Whether to indent the body of a C++11 lambda. indent_cpp_lambda_body = false # true/false # How to indent compound literals that are being returned. # true: add both the indent from return & the compound literal open brace # (i.e. 2 indent levels) # false: only indent 1 level, don't add the indent for the open brace, only # add the indent for the return. # # Default: true indent_compound_literal_return = true # true/false # (C#) Whether to indent a 'using' block if no braces are used. # # Default: true indent_using_block = true # true/false # How to indent the continuation of ternary operator. # # 0: Off (default) # 1: When the `if_false` is a continuation, indent it under the `if_true` branch # 2: When the `:` is a continuation, indent it under `?` indent_ternary_operator = 0 # unsigned number # Whether to indent the statements inside ternary operator. indent_inside_ternary_operator = false # true/false # If true, the indentation of the chunks after a `return` sequence will be set at return indentation column. indent_off_after_return = false # true/false # If true, the indentation of the chunks after a `return new` sequence will be set at return indentation column. indent_off_after_return_new = false # true/false # If true, the tokens after return are indented with regular single indentation. 
By default (false) the indentation is after the return token. indent_single_after_return = false # true/false # Whether to ignore indent and alignment for 'asm' blocks (i.e. assume they # have their own indentation). indent_ignore_asm_block = false # true/false # Don't indent the close parenthesis of a function definition, # if the parenthesis is on its own line. donot_indent_func_def_close_paren = false # true/false # # Newline adding and removing options # # Whether to collapse empty blocks between '{' and '}' except for functions. # Use nl_collapse_empty_body_functions to specify how empty function braces # should be formatted. nl_collapse_empty_body = false # true/false # Whether to collapse empty blocks between '{' and '}' for functions only. # If true, overrides nl_inside_empty_func. nl_collapse_empty_body_functions = false # true/false # Don't split one-line braced assignments, as in 'foo_t f = { 1, 2 };'. nl_assign_leave_one_liners = false # true/false # Don't split one-line braced statements inside a 'class xx { }' body. nl_class_leave_one_liners = false # true/false # Don't split one-line enums, as in 'enum foo { BAR = 15 };' nl_enum_leave_one_liners = false # true/false # Don't split one-line get or set functions. nl_getset_leave_one_liners = false # true/false # (C#) Don't split one-line property get or set functions. nl_cs_property_leave_one_liners = false # true/false # Don't split one-line function definitions, as in 'int foo() { return 0; }'. # might modify nl_func_type_name nl_func_leave_one_liners = false # true/false # Don't split one-line C++11 lambdas, as in '[]() { return 0; }'. nl_cpp_lambda_leave_one_liners = false # true/false # Don't split one-line if/else statements, as in 'if(...) b++;'. nl_if_leave_one_liners = false # true/false # Don't split one-line while statements, as in 'while(...) b++;'. nl_while_leave_one_liners = false # true/false # Don't split one-line do statements, as in 'do { b++; } while(...);'. 
nl_do_leave_one_liners = false # true/false # Don't split one-line for statements, as in 'for(...) b++;'. nl_for_leave_one_liners = false # true/false # (OC) Don't split one-line Objective-C messages. nl_oc_msg_leave_one_liner = false # true/false # (OC) Add or remove newline between method declaration and '{'. nl_oc_mdef_brace = ignore # ignore/add/remove/force # (OC) Add or remove newline between Objective-C block signature and '{'. nl_oc_block_brace = ignore # ignore/add/remove/force # (OC) Add or remove blank line before '@interface' statement. nl_oc_before_interface = ignore # ignore/add/remove/force # (OC) Add or remove blank line before '@implementation' statement. nl_oc_before_implementation = ignore # ignore/add/remove/force # (OC) Add or remove blank line before '@end' statement. nl_oc_before_end = ignore # ignore/add/remove/force # (OC) Add or remove newline between '@interface' and '{'. nl_oc_interface_brace = ignore # ignore/add/remove/force # (OC) Add or remove newline between '@implementation' and '{'. nl_oc_implementation_brace = ignore # ignore/add/remove/force # Add or remove newlines at the start of the file. nl_start_of_file = ignore # ignore/add/remove/force # The minimum number of newlines at the start of the file (only used if # nl_start_of_file is 'add' or 'force'). nl_start_of_file_min = 0 # unsigned number # Add or remove newline at the end of the file. nl_end_of_file = ignore # ignore/add/remove/force # The minimum number of newlines at the end of the file (only used if # nl_end_of_file is 'add' or 'force'). nl_end_of_file_min = 0 # unsigned number # Add or remove newline between '=' and '{'. nl_assign_brace = ignore # ignore/add/remove/force # (D) Add or remove newline between '=' and '['. nl_assign_square = ignore # ignore/add/remove/force # Add or remove newline between '[]' and '{'. nl_tsquare_brace = ignore # ignore/add/remove/force # (D) Add or remove newline after '= ['. Will also affect the newline before # the ']'. 
nl_after_square_assign = ignore # ignore/add/remove/force # Add or remove newline between a function call's ')' and '{', as in # 'list_for_each(item, &list) { }'. nl_fcall_brace = ignore # ignore/add/remove/force # Add or remove newline between 'enum' and '{'. nl_enum_brace = ignore # ignore/add/remove/force # Add or remove newline between 'enum' and 'class'. nl_enum_class = ignore # ignore/add/remove/force # Add or remove newline between 'enum class' and the identifier. nl_enum_class_identifier = ignore # ignore/add/remove/force # Add or remove newline between 'enum class' type and ':'. nl_enum_identifier_colon = ignore # ignore/add/remove/force # Add or remove newline between 'enum class identifier :' and type. nl_enum_colon_type = ignore # ignore/add/remove/force # Add or remove newline between 'struct' and '{'. nl_struct_brace = ignore # ignore/add/remove/force # Add or remove newline between 'union' and '{'. nl_union_brace = ignore # ignore/add/remove/force # Add or remove newline between 'if' and '{'. nl_if_brace = ignore # ignore/add/remove/force # Add or remove newline between '}' and 'else'. nl_brace_else = ignore # ignore/add/remove/force # Add or remove newline between 'else if' and '{'. If set to ignore, # nl_if_brace is used instead. nl_elseif_brace = ignore # ignore/add/remove/force # Add or remove newline between 'else' and '{'. nl_else_brace = ignore # ignore/add/remove/force # Add or remove newline between 'else' and 'if'. nl_else_if = ignore # ignore/add/remove/force # Add or remove newline before '{' opening brace nl_before_opening_brace_func_class_def = ignore # ignore/add/remove/force # Add or remove newline before 'if'/'else if' closing parenthesis. nl_before_if_closing_paren = ignore # ignore/add/remove/force # Add or remove newline between '}' and 'finally'. nl_brace_finally = ignore # ignore/add/remove/force # Add or remove newline between 'finally' and '{'. 
nl_finally_brace = ignore # ignore/add/remove/force # Add or remove newline between 'try' and '{'. nl_try_brace = ignore # ignore/add/remove/force # Add or remove newline between get/set and '{'. nl_getset_brace = ignore # ignore/add/remove/force # Add or remove newline between 'for' and '{'. nl_for_brace = ignore # ignore/add/remove/force # Add or remove newline before the '{' of a 'catch' statement, as in # 'catch (decl) {'. nl_catch_brace = ignore # ignore/add/remove/force # (OC) Add or remove newline before the '{' of a '@catch' statement, as in # '@catch (decl) {'. If set to ignore, nl_catch_brace is used. nl_oc_catch_brace = ignore # ignore/add/remove/force # Add or remove newline between '}' and 'catch'. nl_brace_catch = ignore # ignore/add/remove/force # (OC) Add or remove newline between '}' and '@catch'. If set to ignore, # nl_brace_catch is used. nl_oc_brace_catch = ignore # ignore/add/remove/force # Add or remove newline between '}' and ']'. nl_brace_square = ignore # ignore/add/remove/force # Add or remove newline between '}' and ')' in a function invocation. nl_brace_fparen = ignore # ignore/add/remove/force # Add or remove newline between 'while' and '{'. nl_while_brace = ignore # ignore/add/remove/force # (D) Add or remove newline between 'scope (x)' and '{'. nl_scope_brace = ignore # ignore/add/remove/force # (D) Add or remove newline between 'unittest' and '{'. nl_unittest_brace = ignore # ignore/add/remove/force # (D) Add or remove newline between 'version (x)' and '{'. nl_version_brace = ignore # ignore/add/remove/force # (C#) Add or remove newline between 'using' and '{'. nl_using_brace = ignore # ignore/add/remove/force # Add or remove newline between two open or close braces. Due to general # newline/brace handling, REMOVE may not work. nl_brace_brace = ignore # ignore/add/remove/force # Add or remove newline between 'do' and '{'. nl_do_brace = ignore # ignore/add/remove/force # Add or remove newline between '}' and 'while' of 'do' statement. 
nl_brace_while = ignore # ignore/add/remove/force # Add or remove newline between 'switch' and '{'. nl_switch_brace = ignore # ignore/add/remove/force # Add or remove newline between 'synchronized' and '{'. nl_synchronized_brace = ignore # ignore/add/remove/force # Add a newline between ')' and '{' if the ')' is on a different line than the # if/for/etc. # # Overrides nl_for_brace, nl_if_brace, nl_switch_brace, nl_while_brace and # nl_catch_brace. nl_multi_line_cond = false # true/false # Add a newline after '(' if an if/for/while/switch condition spans multiple # lines nl_multi_line_sparen_open = ignore # ignore/add/remove/force # Add a newline before ')' if an if/for/while/switch condition spans multiple # lines. Overrides nl_before_if_closing_paren if both are specified. nl_multi_line_sparen_close = ignore # ignore/add/remove/force # Force a newline in a define after the macro name for multi-line defines. nl_multi_line_define = false # true/false # Whether to add a newline before 'case', and a blank line before a 'case' # statement that follows a ';' or '}'. nl_before_case = false # true/false # Whether to add a newline after a 'case' statement. nl_after_case = false # true/false # Add or remove newline between a case ':' and '{'. # # Overrides nl_after_case. nl_case_colon_brace = ignore # ignore/add/remove/force # Add or remove newline between ')' and 'throw'. nl_before_throw = ignore # ignore/add/remove/force # Add or remove newline between 'namespace' and '{'. nl_namespace_brace = ignore # ignore/add/remove/force # Add or remove newline after 'template<...>' of a template class. nl_template_class = ignore # ignore/add/remove/force # Add or remove newline after 'template<...>' of a template class declaration. # # Overrides nl_template_class. nl_template_class_decl = ignore # ignore/add/remove/force # Add or remove newline after 'template<>' of a specialized class declaration. # # Overrides nl_template_class_decl. 
nl_template_class_decl_special = ignore # ignore/add/remove/force # Add or remove newline after 'template<...>' of a template class definition. # # Overrides nl_template_class. nl_template_class_def = ignore # ignore/add/remove/force # Add or remove newline after 'template<>' of a specialized class definition. # # Overrides nl_template_class_def. nl_template_class_def_special = ignore # ignore/add/remove/force # Add or remove newline after 'template<...>' of a template function. nl_template_func = ignore # ignore/add/remove/force # Add or remove newline after 'template<...>' of a template function # declaration. # # Overrides nl_template_func. nl_template_func_decl = ignore # ignore/add/remove/force # Add or remove newline after 'template<>' of a specialized function # declaration. # # Overrides nl_template_func_decl. nl_template_func_decl_special = ignore # ignore/add/remove/force # Add or remove newline after 'template<...>' of a template function # definition. # # Overrides nl_template_func. nl_template_func_def = ignore # ignore/add/remove/force # Add or remove newline after 'template<>' of a specialized function # definition. # # Overrides nl_template_func_def. nl_template_func_def_special = ignore # ignore/add/remove/force # Add or remove newline after 'template<...>' of a template variable. nl_template_var = ignore # ignore/add/remove/force # Add or remove newline between 'template<...>' and 'using' of a templated # type alias. nl_template_using = ignore # ignore/add/remove/force # Add or remove newline between 'class' and '{'. nl_class_brace = ignore # ignore/add/remove/force # Add or remove newline before or after (depending on pos_class_comma, # may not be IGNORE) each ',' in the base class list. nl_class_init_args = ignore # ignore/add/remove/force # Add or remove newline after each ',' in the constructor member # initialization. Related to nl_constr_colon, pos_constr_colon and # pos_constr_comma. 
nl_constr_init_args = ignore # ignore/add/remove/force # Add or remove newline before first element, after comma, and after last # element, in 'enum'. nl_enum_own_lines = ignore # ignore/add/remove/force # Add or remove newline between return type and function name in a function # definition. # might be modified by nl_func_leave_one_liners nl_func_type_name = ignore # ignore/add/remove/force # Add or remove newline between return type and function name inside a class # definition. If set to ignore, nl_func_type_name or nl_func_proto_type_name # is used instead. nl_func_type_name_class = ignore # ignore/add/remove/force # Add or remove newline between class specification and '::' # in 'void A::f() { }'. Only appears in separate member implementation (does # not appear with in-line implementation). nl_func_class_scope = ignore # ignore/add/remove/force # Add or remove newline between function scope and name, as in # 'void A :: f() { }'. nl_func_scope_name = ignore # ignore/add/remove/force # Add or remove newline between return type and function name in a prototype. nl_func_proto_type_name = ignore # ignore/add/remove/force # Add or remove newline between a function name and the opening '(' in the # declaration. nl_func_paren = ignore # ignore/add/remove/force # Overrides nl_func_paren for functions with no parameters. nl_func_paren_empty = ignore # ignore/add/remove/force # Add or remove newline between a function name and the opening '(' in the # definition. nl_func_def_paren = ignore # ignore/add/remove/force # Overrides nl_func_def_paren for functions with no parameters. nl_func_def_paren_empty = ignore # ignore/add/remove/force # Add or remove newline between a function name and the opening '(' in the # call. nl_func_call_paren = ignore # ignore/add/remove/force # Overrides nl_func_call_paren for functions with no parameters. nl_func_call_paren_empty = ignore # ignore/add/remove/force # Add or remove newline after '(' in a function declaration. 
nl_func_decl_start = ignore # ignore/add/remove/force # Add or remove newline after '(' in a function definition. nl_func_def_start = ignore # ignore/add/remove/force # Overrides nl_func_decl_start when there is only one parameter. nl_func_decl_start_single = ignore # ignore/add/remove/force # Overrides nl_func_def_start when there is only one parameter. nl_func_def_start_single = ignore # ignore/add/remove/force # Whether to add a newline after '(' in a function declaration if '(' and ')' # are in different lines. If false, nl_func_decl_start is used instead. nl_func_decl_start_multi_line = false # true/false # Whether to add a newline after '(' in a function definition if '(' and ')' # are in different lines. If false, nl_func_def_start is used instead. nl_func_def_start_multi_line = false # true/false # Add or remove newline after each ',' in a function declaration. nl_func_decl_args = ignore # ignore/add/remove/force # Add or remove newline after each ',' in a function definition. nl_func_def_args = ignore # ignore/add/remove/force # Add or remove newline after each ',' in a function call. nl_func_call_args = ignore # ignore/add/remove/force # Whether to add a newline after each ',' in a function declaration if '(' # and ')' are in different lines. If false, nl_func_decl_args is used instead. nl_func_decl_args_multi_line = false # true/false # Whether to add a newline after each ',' in a function definition if '(' # and ')' are in different lines. If false, nl_func_def_args is used instead. nl_func_def_args_multi_line = false # true/false # Add or remove newline before the ')' in a function declaration. nl_func_decl_end = ignore # ignore/add/remove/force # Add or remove newline before the ')' in a function definition. nl_func_def_end = ignore # ignore/add/remove/force # Overrides nl_func_decl_end when there is only one parameter. nl_func_decl_end_single = ignore # ignore/add/remove/force # Overrides nl_func_def_end when there is only one parameter. 
nl_func_def_end_single = ignore # ignore/add/remove/force # Whether to add a newline before ')' in a function declaration if '(' and ')' # are in different lines. If false, nl_func_decl_end is used instead. nl_func_decl_end_multi_line = false # true/false # Whether to add a newline before ')' in a function definition if '(' and ')' # are in different lines. If false, nl_func_def_end is used instead. nl_func_def_end_multi_line = false # true/false # Add or remove newline between '()' in a function declaration. nl_func_decl_empty = ignore # ignore/add/remove/force # Add or remove newline between '()' in a function definition. nl_func_def_empty = ignore # ignore/add/remove/force # Add or remove newline between '()' in a function call. nl_func_call_empty = ignore # ignore/add/remove/force # Whether to add a newline after '(' in a function call, # has preference over nl_func_call_start_multi_line. nl_func_call_start = ignore # ignore/add/remove/force # Whether to add a newline before ')' in a function call. nl_func_call_end = ignore # ignore/add/remove/force # Whether to add a newline after '(' in a function call if '(' and ')' are in # different lines. nl_func_call_start_multi_line = false # true/false # Whether to add a newline after each ',' in a function call if '(' and ')' # are in different lines. nl_func_call_args_multi_line = false # true/false # Whether to add a newline before ')' in a function call if '(' and ')' are in # different lines. nl_func_call_end_multi_line = false # true/false # Whether to respect nl_func_call_XXX option in case of closure args. nl_func_call_args_multi_line_ignore_closures = false # true/false # Whether to add a newline after '<' of a template parameter list. nl_template_start = false # true/false # Whether to add a newline after each ',' in a template parameter list. nl_template_args = false # true/false # Whether to add a newline before '>' of a template parameter list. 
nl_template_end = false # true/false # (OC) Whether to put each Objective-C message parameter on a separate line. # See nl_oc_msg_leave_one_liner. nl_oc_msg_args = false # true/false # (OC) Minimum number of Objective-C message parameters before applying nl_oc_msg_args. nl_oc_msg_args_min_params = 0 # unsigned number # (OC) Max code width of Objective-C message before applying nl_oc_msg_args. nl_oc_msg_args_max_code_width = 0 # unsigned number # (OC) Whether to apply nl_oc_msg_args if some of the parameters are already # on new lines. Overrides nl_oc_msg_args_min_params and nl_oc_msg_args_max_code_width. nl_oc_msg_args_finish_multi_line = false # true/false # Add or remove newline between function signature and '{'. nl_fdef_brace = ignore # ignore/add/remove/force # Add or remove newline between function signature and '{', # if signature ends with ')'. Overrides nl_fdef_brace. nl_fdef_brace_cond = ignore # ignore/add/remove/force # Add or remove newline between C++11 lambda signature and '{'. nl_cpp_ldef_brace = ignore # ignore/add/remove/force # Add or remove newline between 'return' and the return expression. nl_return_expr = ignore # ignore/add/remove/force # Add or remove newline between 'throw' and the throw expression. nl_throw_expr = ignore # ignore/add/remove/force # Whether to add a newline after semicolons, except in 'for' statements. nl_after_semicolon = false # true/false # (Java) Add or remove newline between the ')' and '{{' of the double brace # initializer. nl_paren_dbrace_open = ignore # ignore/add/remove/force # Whether to add a newline after the type in an unnamed temporary # direct-list-initialization, better: # before a direct-list-initialization. nl_type_brace_init_lst = ignore # ignore/add/remove/force # Whether to add a newline after the open brace in an unnamed temporary # direct-list-initialization. 
nl_type_brace_init_lst_open = ignore # ignore/add/remove/force # Whether to add a newline before the close brace in an unnamed temporary # direct-list-initialization. nl_type_brace_init_lst_close = ignore # ignore/add/remove/force # Whether to add a newline before '{'. nl_before_brace_open = false # true/false # Whether to add a newline after '{'. nl_after_brace_open = false # true/false # Whether to add a newline between the open brace and a trailing single-line # comment. Requires nl_after_brace_open=true. nl_after_brace_open_cmt = false # true/false # Whether to add a newline after a virtual brace open with a non-empty body. # These occur in un-braced if/while/do/for statement bodies. nl_after_vbrace_open = false # true/false # Whether to add a newline after a virtual brace open with an empty body. # These occur in un-braced if/while/do/for statement bodies. nl_after_vbrace_open_empty = false # true/false # Whether to add a newline after '}'. Does not apply if followed by a # necessary ';'. nl_after_brace_close = false # true/false # Whether to add a newline after a virtual brace close, # as in 'if (foo) a++; return;'. nl_after_vbrace_close = false # true/false # Add or remove newline between the close brace and identifier, # as in 'struct { int a; } b;'. Affects enumerations, unions and # structures. If set to ignore, uses nl_after_brace_close. nl_brace_struct_var = ignore # ignore/add/remove/force # Whether to alter newlines in '#define' macros. nl_define_macro = false # true/false # Whether to alter newlines between consecutive parenthesis closes. The number # of closing parentheses in a line will depend on respective open parenthesis # lines. nl_squeeze_paren_close = false # true/false # Whether to remove blanks after '#ifxx' and '#elxx', or before '#elxx' and # '#endif'. Does not affect top-level #ifdefs. nl_squeeze_ifdef = false # true/false # Makes the nl_squeeze_ifdef option affect the top-level #ifdefs as well. 
nl_squeeze_ifdef_top_level = false # true/false # Add or remove blank line before 'if'. nl_before_if = ignore # ignore/add/remove/force # Add or remove blank line after 'if' statement. Add/Force work only if the # next token is not a closing brace. nl_after_if = ignore # ignore/add/remove/force # Add or remove blank line before 'for'. nl_before_for = ignore # ignore/add/remove/force # Add or remove blank line after 'for' statement. nl_after_for = ignore # ignore/add/remove/force # Add or remove blank line before 'while'. nl_before_while = ignore # ignore/add/remove/force # Add or remove blank line after 'while' statement. nl_after_while = ignore # ignore/add/remove/force # Add or remove blank line before 'switch'. nl_before_switch = ignore # ignore/add/remove/force # Add or remove blank line after 'switch' statement. nl_after_switch = ignore # ignore/add/remove/force # Add or remove blank line before 'synchronized'. nl_before_synchronized = ignore # ignore/add/remove/force # Add or remove blank line after 'synchronized' statement. nl_after_synchronized = ignore # ignore/add/remove/force # Add or remove blank line before 'do'. nl_before_do = ignore # ignore/add/remove/force # Add or remove blank line after 'do/while' statement. nl_after_do = ignore # ignore/add/remove/force # Ignore nl_before_{if,for,switch,do,synchronized} if the control # statement is immediately after a case statement. # if nl_before_{if,for,switch,do} is set to remove, this option # does nothing. nl_before_ignore_after_case = false # true/false # Whether to put a blank line before 'return' statements, unless after an open # brace. nl_before_return = false # true/false # Whether to put a blank line after 'return' statements, unless followed by a # close brace. nl_after_return = false # true/false # Whether to put a blank line before a member '.' or '->' operators. nl_before_member = ignore # ignore/add/remove/force # (Java) Whether to put a blank line after a member '.' or '->' operators. 
nl_after_member = ignore # ignore/add/remove/force # Whether to double-space commented-entries in 'struct'/'union'/'enum'. nl_ds_struct_enum_cmt = false # true/false # Whether to force a newline before '}' of a 'struct'/'union'/'enum'. # (Lower priority than eat_blanks_before_close_brace.) nl_ds_struct_enum_close_brace = false # true/false # Add or remove newline before or after (depending on pos_class_colon) a class # colon, as in 'class Foo : public Bar'. nl_class_colon = ignore # ignore/add/remove/force # Add or remove newline around a class constructor colon. The exact position # depends on nl_constr_init_args, pos_constr_colon and pos_constr_comma. nl_constr_colon = ignore # ignore/add/remove/force # Whether to collapse a two-line namespace, like 'namespace foo\n{ decl; }' # into a single line. If true, prevents other brace newline rules from turning # such code into four lines. If true, it also preserves one-liner namespaces. nl_namespace_two_to_one_liner = false # true/false # Whether to remove a newline in simple unbraced if statements, turning them # into one-liners, as in 'if(b)\n i++;' => 'if(b) i++;'. nl_create_if_one_liner = false # true/false # Whether to remove a newline in simple unbraced for statements, turning them # into one-liners, as in 'for (...)\n stmt;' => 'for (...) stmt;'. nl_create_for_one_liner = false # true/false # Whether to remove a newline in simple unbraced while statements, turning # them into one-liners, as in 'while (expr)\n stmt;' => 'while (expr) stmt;'. nl_create_while_one_liner = false # true/false # Whether to collapse a function definition whose body (not counting braces) # is only one line so that the entire definition (prototype, braces, body) is # a single line. nl_create_func_def_one_liner = false # true/false # Whether to split one-line simple list definitions into three lines by # adding newlines, as in 'int a[12] = { 0 };'. 
nl_create_list_one_liner = false # true/false # Whether to split one-line simple unbraced if statements into two lines by # adding a newline, as in 'if(b) i++;'. nl_split_if_one_liner = false # true/false # Whether to split one-line simple unbraced for statements into two lines by # adding a newline, as in 'for (...) stmt;'. nl_split_for_one_liner = false # true/false # Whether to split one-line simple unbraced while statements into two lines by # adding a newline, as in 'while (expr) stmt;'. nl_split_while_one_liner = false # true/false # Don't add a newline before a cpp-comment in a parameter list of a function # call. donot_add_nl_before_cpp_comment = false # true/false # # Blank line options # # The maximum number of consecutive newlines (3 = 2 blank lines). nl_max = 0 # unsigned number # The maximum number of consecutive newlines in a function. nl_max_blank_in_func = 0 # unsigned number # The number of newlines inside an empty function body. # This option overrides eat_blanks_after_open_brace and # eat_blanks_before_close_brace, but is ignored when # nl_collapse_empty_body_functions=true nl_inside_empty_func = 0 # unsigned number # The number of newlines before a function prototype. nl_before_func_body_proto = 0 # unsigned number # The number of newlines before a multi-line function definition. Where # applicable, this option is overridden with eat_blanks_after_open_brace=true nl_before_func_body_def = 0 # unsigned number # The number of newlines before a class constructor/destructor prototype. nl_before_func_class_proto = 0 # unsigned number # The number of newlines before a class constructor/destructor definition. nl_before_func_class_def = 0 # unsigned number # The number of newlines after a function prototype. nl_after_func_proto = 0 # unsigned number # The number of newlines after a function prototype, if not followed by # another function prototype. 
nl_after_func_proto_group = 0 # unsigned number # The number of newlines after a class constructor/destructor prototype. nl_after_func_class_proto = 0 # unsigned number # The number of newlines after a class constructor/destructor prototype, # if not followed by another constructor/destructor prototype. nl_after_func_class_proto_group = 0 # unsigned number # Whether one-line method definitions inside a class body should be treated # as if they were prototypes for the purposes of adding newlines. # # Requires nl_class_leave_one_liners=true. Overrides nl_before_func_body_def # and nl_before_func_class_def for one-liners. nl_class_leave_one_liner_groups = false # true/false # The number of newlines after '}' of a multi-line function body. # # Overrides nl_min_after_func_body and nl_max_after_func_body. nl_after_func_body = 0 # unsigned number # The minimum number of newlines after '}' of a multi-line function body. # # Only works when nl_after_func_body is 0. nl_min_after_func_body = 0 # unsigned number # The maximum number of newlines after '}' of a multi-line function body. # # Only works when nl_after_func_body is 0. # Takes precedence over nl_min_after_func_body. nl_max_after_func_body = 0 # unsigned number # The number of newlines after '}' of a multi-line function body in a class # declaration. Also affects class constructors/destructors. # # Overrides nl_after_func_body. nl_after_func_body_class = 0 # unsigned number # The number of newlines after '}' of a single line function body. Also # affects class constructors/destructors. # # Overrides nl_after_func_body and nl_after_func_body_class. nl_after_func_body_one_liner = 0 # unsigned number # The number of newlines before a block of typedefs. If nl_after_access_spec # is non-zero, that option takes precedence. # # 0: No change (default). nl_typedef_blk_start = 0 # unsigned number # The number of newlines after a block of typedefs. # # 0: No change (default). 
nl_typedef_blk_end = 0 # unsigned number # The maximum number of consecutive newlines within a block of typedefs. # # 0: No change (default). nl_typedef_blk_in = 0 # unsigned number # The minimum number of blank lines after a block of variable definitions # at the top of a function body. If any preprocessor directives appear # between the opening brace of the function and the variable block, then # it is considered as not at the top of the function. Newlines are added # before trailing preprocessor directives, if any exist. # # 0: No change (default). nl_var_def_blk_end_func_top = 0 # unsigned number # The minimum number of empty newlines before a block of variable definitions # not at the top of a function body. If nl_after_access_spec is non-zero, # that option takes precedence. Newlines are not added at the top of the # file or just after an opening brace. Newlines are added above any # preprocessor directives before the block. # # 0: No change (default). nl_var_def_blk_start = 0 # unsigned number # The minimum number of empty newlines after a block of variable definitions # not at the top of a function body. Newlines are not added if the block # is at the bottom of the file or just before a preprocessor directive. # # 0: No change (default). nl_var_def_blk_end = 0 # unsigned number # The maximum number of consecutive newlines within a block of variable # definitions. # # 0: No change (default). nl_var_def_blk_in = 0 # unsigned number # The minimum number of newlines before a multi-line comment. # Doesn't apply if after a brace open or another multi-line comment. nl_before_block_comment = 0 # unsigned number # The minimum number of newlines before a single-line C comment. # Doesn't apply if after a brace open or other single-line C comments. nl_before_c_comment = 0 # unsigned number # The minimum number of newlines before a CPP comment. # Doesn't apply if after a brace open or other CPP comments. 
nl_before_cpp_comment = 0 # unsigned number # Whether to force a newline after a multi-line comment. nl_after_multiline_comment = false # true/false # Whether to force a newline after a label's colon. nl_after_label_colon = false # true/false # The number of newlines before a struct definition. nl_before_struct = 0 # unsigned number # The number of newlines after '}' or ';' of a struct/enum/union definition. nl_after_struct = 0 # unsigned number # The number of newlines before a class definition. nl_before_class = 0 # unsigned number # The number of newlines after '}' or ';' of a class definition. nl_after_class = 0 # unsigned number # The number of newlines before a namespace. nl_before_namespace = 0 # unsigned number # The number of newlines after '{' of a namespace. This also adds newlines # before the matching '}'. # # 0: Apply eat_blanks_after_open_brace or eat_blanks_before_close_brace if # applicable, otherwise no change. # # Overrides eat_blanks_after_open_brace and eat_blanks_before_close_brace. nl_inside_namespace = 0 # unsigned number # The number of newlines after '}' of a namespace. nl_after_namespace = 0 # unsigned number # The number of newlines before an access specifier label. This also includes # the Qt-specific 'signals:' and 'slots:'. Will not change the newline count # if after a brace open. # # 0: No change (default). nl_before_access_spec = 0 # unsigned number # The number of newlines after an access specifier label. This also includes # the Qt-specific 'signals:' and 'slots:'. Will not change the newline count # if after a brace open. # # 0: No change (default). # # Overrides nl_typedef_blk_start and nl_var_def_blk_start. nl_after_access_spec = 0 # unsigned number # The number of newlines between a function definition and the function # comment, as in '// comment\n void foo() {...}'. # # 0: No change (default). 
nl_comment_func_def = 0 # unsigned number # The number of newlines after a try-catch-finally block that isn't followed # by a brace close. # # 0: No change (default). nl_after_try_catch_finally = 0 # unsigned number # (C#) The number of newlines before and after a property, indexer or event # declaration. # # 0: No change (default). nl_around_cs_property = 0 # unsigned number # (C#) The number of newlines between the get/set/add/remove handlers. # # 0: No change (default). nl_between_get_set = 0 # unsigned number # (C#) Add or remove newline between property and the '{'. nl_property_brace = ignore # ignore/add/remove/force # Whether to remove blank lines after '{'. eat_blanks_after_open_brace = false # true/false # Whether to remove blank lines before '}'. eat_blanks_before_close_brace = false # true/false # How aggressively to remove extra newlines not in preprocessor. # # 0: No change (default) # 1: Remove most newlines not handled by other config # 2: Remove all newlines and reformat completely by config nl_remove_extra_newlines = 0 # unsigned number # (Java) Add or remove newline after an annotation statement. Only affects # annotations that are after a newline. nl_after_annotation = ignore # ignore/add/remove/force # (Java) Add or remove newline between two annotations. nl_between_annotation = ignore # ignore/add/remove/force # The number of newlines before a whole-file #ifdef. # # 0: No change (default). nl_before_whole_file_ifdef = 0 # unsigned number # The number of newlines after a whole-file #ifdef. # # 0: No change (default). nl_after_whole_file_ifdef = 0 # unsigned number # The number of newlines before a whole-file #endif. # # 0: No change (default). nl_before_whole_file_endif = 0 # unsigned number # The number of newlines after a whole-file #endif. # # 0: No change (default). nl_after_whole_file_endif = 0 # unsigned number # # Positioning options # # The position of arithmetic operators in wrapped expressions. 
pos_arith = ignore # ignore/break/force/lead/trail/join/lead_break/lead_force/trail_break/trail_force # The position of assignment in wrapped expressions. Do not affect '=' # followed by '{'. pos_assign = ignore # ignore/break/force/lead/trail/join/lead_break/lead_force/trail_break/trail_force # The position of Boolean operators in wrapped expressions. pos_bool = ignore # ignore/break/force/lead/trail/join/lead_break/lead_force/trail_break/trail_force # The position of comparison operators in wrapped expressions. pos_compare = ignore # ignore/break/force/lead/trail/join/lead_break/lead_force/trail_break/trail_force # The position of conditional operators, as in the '?' and ':' of # 'expr ? stmt : stmt', in wrapped expressions. pos_conditional = ignore # ignore/break/force/lead/trail/join/lead_break/lead_force/trail_break/trail_force # The position of the comma in wrapped expressions. pos_comma = ignore # ignore/break/force/lead/trail/join/lead_break/lead_force/trail_break/trail_force # The position of the comma in enum entries. pos_enum_comma = ignore # ignore/break/force/lead/trail/join/lead_break/lead_force/trail_break/trail_force # The position of the comma in the base class list if there is more than one # line. Affects nl_class_init_args. pos_class_comma = ignore # ignore/break/force/lead/trail/join/lead_break/lead_force/trail_break/trail_force # The position of the comma in the constructor initialization list. # Related to nl_constr_colon, nl_constr_init_args and pos_constr_colon. pos_constr_comma = ignore # ignore/break/force/lead/trail/join/lead_break/lead_force/trail_break/trail_force # The position of trailing/leading class colon, between class and base class # list. Affects nl_class_colon. pos_class_colon = ignore # ignore/break/force/lead/trail/join/lead_break/lead_force/trail_break/trail_force # The position of colons between constructor and member initialization. # Related to nl_constr_colon, nl_constr_init_args and pos_constr_comma. 
pos_constr_colon = ignore # ignore/break/force/lead/trail/join/lead_break/lead_force/trail_break/trail_force # The position of shift operators in wrapped expressions. pos_shift = ignore # ignore/break/force/lead/trail/join/lead_break/lead_force/trail_break/trail_force # # Line splitting options # # Try to limit code width to N columns. code_width = 0 # unsigned number # Whether to fully split long 'for' statements at semi-colons. ls_for_split_full = false # true/false # Whether to fully split long function prototypes/calls at commas. # The option ls_code_width has priority over the option ls_func_split_full. ls_func_split_full = false # true/false # Whether to split lines as close to code_width as possible and ignore some # groupings. # The option ls_code_width has priority over the option ls_func_split_full. ls_code_width = false # true/false # # Code alignment options (not left column spaces/tabs) # # Whether to keep non-indenting tabs. align_keep_tabs = false # true/false # Whether to use tabs for aligning. align_with_tabs = false # true/false # Whether to bump out to the next tab when aligning. align_on_tabstop = false # true/false # Whether to right-align numbers. align_number_right = false # true/false # Whether to keep whitespace not required for alignment. align_keep_extra_space = false # true/false # Whether to align variable definitions in prototypes and functions. align_func_params = false # true/false # The span for aligning parameter definitions in function on parameter name. # # 0: Don't align (default). align_func_params_span = 1 # unsigned number # The threshold for aligning function parameter definitions. # Use a negative number for absolute thresholds. # # 0: No limit (default). align_func_params_thresh = 0 # number # The gap for aligning function parameter definitions. align_func_params_gap = 0 # unsigned number # The span for aligning constructor value. # # 0: Don't align (default). 
align_constr_value_span = 0 # unsigned number # The threshold for aligning constructor value. # Use a negative number for absolute thresholds. # # 0: No limit (default). align_constr_value_thresh = 0 # number # The gap for aligning constructor value. align_constr_value_gap = 0 # unsigned number # Whether to align parameters in single-line functions that have the same # name. The function names must already be aligned with each other. align_same_func_call_params = false # true/false # The span for aligning function-call parameters for single line functions. # # 0: Don't align (default). align_same_func_call_params_span = 0 # unsigned number # The threshold for aligning function-call parameters for single line # functions. # Use a negative number for absolute thresholds. # # 0: No limit (default). align_same_func_call_params_thresh = 0 # number # The span for aligning variable definitions. # # 0: Don't align (default). align_var_def_span = 0 # unsigned number # How to consider (or treat) the '*' in the alignment of variable definitions. # # 0: Part of the type 'void * foo;' (default) # 1: Part of the variable 'void *foo;' # 2: Dangling 'void *foo;' # Dangling: the '*' will not be taken into account when aligning. align_var_def_star_style = 0 # unsigned number # How to consider (or treat) the '&' in the alignment of variable definitions. # # 0: Part of the type 'long & foo;' (default) # 1: Part of the variable 'long &foo;' # 2: Dangling 'long &foo;' # Dangling: the '&' will not be taken into account when aligning. align_var_def_amp_style = 0 # unsigned number # The threshold for aligning variable definitions. # Use a negative number for absolute thresholds. # # 0: No limit (default). align_var_def_thresh = 0 # number # The gap for aligning variable definitions. align_var_def_gap = 0 # unsigned number # Whether to align the colon in struct bit fields. align_var_def_colon = false # true/false # The gap for aligning the colon in struct bit fields. 
align_var_def_colon_gap = 0 # unsigned number # Whether to align any attribute after the variable name. align_var_def_attribute = false # true/false # Whether to align inline struct/enum/union variable definitions. align_var_def_inline = false # true/false # The span for aligning on '=' in assignments. # # 0: Don't align (default). align_assign_span = 0 # unsigned number # The span for aligning on '=' in function prototype modifier. # # 0: Don't align (default). align_assign_func_proto_span = 0 # unsigned number # The threshold for aligning on '=' in assignments. # Use a negative number for absolute thresholds. # # 0: No limit (default). align_assign_thresh = 0 # number # Whether to align on the left most assignment when multiple # definitions are found on the same line. # Depends on 'align_assign_span' and 'align_assign_thresh' settings. align_assign_on_multi_var_defs = false # true/false # The span for aligning on '{' in braced init list. # # 0: Don't align (default). align_braced_init_list_span = 0 # unsigned number # The threshold for aligning on '{' in braced init list. # Use a negative number for absolute thresholds. # # 0: No limit (default). align_braced_init_list_thresh = 0 # number # How to apply align_assign_span to function declaration "assignments", i.e. # 'virtual void foo() = 0' or '~foo() = {default|delete}'. # # 0: Align with other assignments (default) # 1: Align with each other, ignoring regular assignments # 2: Don't align align_assign_decl_func = 0 # unsigned number # The span for aligning on '=' in enums. # # 0: Don't align (default). align_enum_equ_span = 0 # unsigned number # The threshold for aligning on '=' in enums. # Use a negative number for absolute thresholds. # # 0: no limit (default). align_enum_equ_thresh = 0 # number # The span for aligning class member definitions. # # 0: Don't align (default). align_var_class_span = 0 # unsigned number # The threshold for aligning class member definitions. 
# Use a negative number for absolute thresholds. # # 0: No limit (default). align_var_class_thresh = 0 # number # The gap for aligning class member definitions. align_var_class_gap = 0 # unsigned number # The span for aligning struct/union member definitions. # # 0: Don't align (default). align_var_struct_span = 0 # unsigned number # The threshold for aligning struct/union member definitions. # Use a negative number for absolute thresholds. # # 0: No limit (default). align_var_struct_thresh = 0 # number # The gap for aligning struct/union member definitions. align_var_struct_gap = 0 # unsigned number # The span for aligning struct initializer values. # # 0: Don't align (default). align_struct_init_span = 0 # unsigned number # The span for aligning single-line typedefs. # # 0: Don't align (default). align_typedef_span = 0 # unsigned number # The minimum space between the type and the synonym of a typedef. align_typedef_gap = 0 # unsigned number # How to align typedef'd functions with other typedefs. # # 0: Don't mix them at all (default) # 1: Align the open parenthesis with the types # 2: Align the function type name with the other type names align_typedef_func = 0 # unsigned number # How to consider (or treat) the '*' in the alignment of typedefs. # # 0: Part of the typedef type, 'typedef int * pint;' (default) # 1: Part of type name: 'typedef int *pint;' # 2: Dangling: 'typedef int *pint;' # Dangling: the '*' will not be taken into account when aligning. align_typedef_star_style = 0 # unsigned number # How to consider (or treat) the '&' in the alignment of typedefs. # # 0: Part of the typedef type, 'typedef int & intref;' (default) # 1: Part of type name: 'typedef int &intref;' # 2: Dangling: 'typedef int &intref;' # Dangling: the '&' will not be taken into account when aligning. align_typedef_amp_style = 0 # unsigned number # The span for aligning comments that end lines. # # 0: Don't align (default). 
align_right_cmt_span = 0 # unsigned number # Minimum number of columns between preceding text and a trailing comment in # order for the comment to qualify for being aligned. Must be non-zero to have # an effect. align_right_cmt_gap = 0 # unsigned number # If aligning comments, whether to mix with comments after '}' and #endif with # less than three spaces before the comment. align_right_cmt_mix = false # true/false # Whether to only align trailing comments that are at the same brace level. align_right_cmt_same_level = false # true/false # Minimum column at which to align trailing comments. Comments which are # aligned beyond this column, but which can be aligned in a lesser column, # may be "pulled in". # # 0: Ignore (default). align_right_cmt_at_col = 0 # unsigned number # The span for aligning function prototypes. # # 0: Don't align (default). align_func_proto_span = 0 # unsigned number # Whether to ignore continuation lines when evaluating the number of # new lines for the function prototype alignment's span. # # false: continuation lines are part of the newlines count # true: continuation lines are not counted align_func_proto_span_ignore_cont_lines = false # true/false # How to consider (or treat) the '*' in the alignment of function prototypes. # # 0: Part of the type 'void * foo();' (default) # 1: Part of the function 'void *foo();' # 2: Dangling 'void *foo();' # Dangling: the '*' will not be taken into account when aligning. align_func_proto_star_style = 0 # unsigned number # How to consider (or treat) the '&' in the alignment of function prototypes. # # 0: Part of the type 'long & foo();' (default) # 1: Part of the function 'long &foo();' # 2: Dangling 'long &foo();' # Dangling: the '&' will not be taken into account when aligning. align_func_proto_amp_style = 0 # unsigned number # The threshold for aligning function prototypes. # Use a negative number for absolute thresholds. # # 0: No limit (default). 
align_func_proto_thresh = 0 # number # Minimum gap between the return type and the function name. align_func_proto_gap = 0 # unsigned number # Whether to align function prototypes on the 'operator' keyword instead of # what follows. align_on_operator = false # true/false # Whether to mix aligning prototype and variable declarations. If true, # align_var_def_XXX options are used instead of align_func_proto_XXX options. align_mix_var_proto = false # true/false # Whether to align single-line functions with function prototypes. # Uses align_func_proto_span. align_single_line_func = false # true/false # Whether to align the open brace of single-line functions. # Requires align_single_line_func=true. Uses align_func_proto_span. align_single_line_brace = false # true/false # Gap for align_single_line_brace. align_single_line_brace_gap = 0 # unsigned number # (OC) The span for aligning Objective-C message specifications. # # 0: Don't align (default). align_oc_msg_spec_span = 0 # unsigned number # Whether and how to align backslashes that split a macro onto multiple lines. # This will not work right if the macro contains a multi-line comment. # # 0: Do nothing (default) # 1: Align the backslashes in the column at the end of the longest line # 2: Align with the backslash that is farthest to the left, or, if that # backslash is farther left than the end of the longest line, at the end of # the longest line # 3: Align with the backslash that is farthest to the right align_nl_cont = 0 # unsigned number # The minimum number of spaces between the end of a line and its continuation # backslash. Requires align_nl_cont. # # Default: 1 align_nl_cont_spaces = 1 # unsigned number # Whether to align macro functions and variables together. align_pp_define_together = false # true/false # The span for aligning on '#define' bodies. 
# # =0: Don't align (default) # >0: Number of lines (including comments) between blocks align_pp_define_span = 0 # unsigned number # The minimum space between label and value of a preprocessor define. align_pp_define_gap = 0 # unsigned number # Whether to align lines that start with '<<' with previous '<<'. # # Default: true align_left_shift = true # true/false # Whether to align comma-separated statements following '<<' (as used to # initialize Eigen matrices). align_eigen_comma_init = false # true/false # Whether to align text after 'asm volatile ()' colons. align_asm_colon = false # true/false # (OC) Span for aligning parameters in an Objective-C message call # on the ':'. # # 0: Don't align. align_oc_msg_colon_span = 0 # unsigned number # (OC) Whether to always align with the first parameter, even if it is too # short. align_oc_msg_colon_first = false # true/false # (OC) Whether to align parameters in an Objective-C '+' or '-' declaration # on the ':'. align_oc_decl_colon = false # true/false # (OC) Whether to not align parameters in an Objectve-C message call if first # colon is not on next line of the message call (the same way Xcode does # alignment) align_oc_msg_colon_xcode_like = false # true/false # # Comment modification options # # Try to wrap comments at N columns. cmt_width = 0 # unsigned number # How to reflow comments. # # 0: No reflowing (apart from the line wrapping due to cmt_width) (default) # 1: No touching at all # 2: Full reflow (enable cmt_indent_multi for indent with line wrapping due to cmt_width) cmt_reflow_mode = 0 # unsigned number # Path to a file that contains regular expressions describing patterns for # which the end of one line and the beginning of the next will be folded into # the same sentence or paragraph during full comment reflow. The regular # expressions are described using ECMAScript syntax. The syntax for this # specification is as follows, where "..." 
indicates the custom regular # expression and "n" indicates the nth end_of_prev_line_regex and # beg_of_next_line_regex regular expression pair: # # end_of_prev_line_regex[1] = "...$" # beg_of_next_line_regex[1] = "^..." # end_of_prev_line_regex[2] = "...$" # beg_of_next_line_regex[2] = "^..." # . # . # . # end_of_prev_line_regex[n] = "...$" # beg_of_next_line_regex[n] = "^..." # # Note that use of this option overrides the default reflow fold regular # expressions, which are internally defined as follows: # # end_of_prev_line_regex[1] = "[\w,\]\)]$" # beg_of_next_line_regex[1] = "^[\w,\[\(]" # end_of_prev_line_regex[2] = "\.$" # beg_of_next_line_regex[2] = "^[A-Z]" cmt_reflow_fold_regex_file = "" # string # Whether to indent wrapped lines to the start of the encompassing paragraph # during full comment reflow (cmt_reflow_mode = 2). Overrides the value # specified by cmt_sp_after_star_cont. # # Note that cmt_align_doxygen_javadoc_tags overrides this option for # paragraphs associated with javadoc tags cmt_reflow_indent_to_paragraph_start = false # true/false # Whether to convert all tabs to spaces in comments. If false, tabs in # comments are left alone, unless used for indenting. cmt_convert_tab_to_spaces = false # true/false # Whether to apply changes to multi-line comments, including cmt_width, # keyword substitution and leading chars. # # Default: true cmt_indent_multi = true # true/false # Whether to align doxygen javadoc-style tags ('@param', '@return', etc.) # and corresponding fields such that groups of consecutive block tags, # parameter names, and descriptions align with one another. Overrides that # which is specified by the cmt_sp_after_star_cont. If cmt_width > 0, it may # be necessary to enable cmt_indent_multi and set cmt_reflow_mode = 2 # in order to achieve the desired alignment for line-wrapping. 
cmt_align_doxygen_javadoc_tags = false # true/false # The number of spaces to insert after the star and before doxygen # javadoc-style tags (@param, @return, etc). Requires enabling # cmt_align_doxygen_javadoc_tags. Overrides that which is specified by the # cmt_sp_after_star_cont. # # Default: 1 cmt_sp_before_doxygen_javadoc_tags = 1 # unsigned number # Whether to change trailing, single-line c-comments into cpp-comments. cmt_trailing_single_line_c_to_cpp = false # true/false # Whether to group c-comments that look like they are in a block. cmt_c_group = false # true/false # Whether to put an empty '/*' on the first line of the combined c-comment. cmt_c_nl_start = false # true/false # Whether to add a newline before the closing '*/' of the combined c-comment. cmt_c_nl_end = false # true/false # Whether to change cpp-comments into c-comments. cmt_cpp_to_c = false # true/false # Whether to group cpp-comments that look like they are in a block. Only # meaningful if cmt_cpp_to_c=true. cmt_cpp_group = false # true/false # Whether to put an empty '/*' on the first line of the combined cpp-comment # when converting to a c-comment. # # Requires cmt_cpp_to_c=true and cmt_cpp_group=true. cmt_cpp_nl_start = false # true/false # Whether to add a newline before the closing '*/' of the combined cpp-comment # when converting to a c-comment. # # Requires cmt_cpp_to_c=true and cmt_cpp_group=true. cmt_cpp_nl_end = false # true/false # Whether to put a star on subsequent comment lines. cmt_star_cont = false # true/false # The number of spaces to insert at the start of subsequent comment lines. cmt_sp_before_star_cont = 0 # unsigned number # The number of spaces to insert after the star on subsequent comment lines. cmt_sp_after_star_cont = 0 # unsigned number # For multi-line comments with a '*' lead, remove leading spaces if the first # and last lines of the comment are the same length. 
# # Default: true cmt_multi_check_last = true # true/false # For multi-line comments with a '*' lead, remove leading spaces if the first # and last lines of the comment are the same length AND if the length is # bigger as the first_len minimum. # # Default: 4 cmt_multi_first_len_minimum = 4 # unsigned number # Path to a file that contains text to insert at the beginning of a file if # the file doesn't start with a C/C++ comment. If the inserted text contains # '$(filename)', that will be replaced with the current file's name. cmt_insert_file_header = "" # string # Path to a file that contains text to insert at the end of a file if the # file doesn't end with a C/C++ comment. If the inserted text contains # '$(filename)', that will be replaced with the current file's name. cmt_insert_file_footer = "" # string # Path to a file that contains text to insert before a function definition if # the function isn't preceded by a C/C++ comment. If the inserted text # contains '$(function)', '$(javaparam)' or '$(fclass)', these will be # replaced with, respectively, the name of the function, the javadoc '@param' # and '@return' stuff, or the name of the class to which the member function # belongs. cmt_insert_func_header = "" # string # Path to a file that contains text to insert before a class if the class # isn't preceded by a C/C++ comment. If the inserted text contains '$(class)', # that will be replaced with the class name. cmt_insert_class_header = "" # string # Path to a file that contains text to insert before an Objective-C message # specification, if the method isn't preceded by a C/C++ comment. If the # inserted text contains '$(message)' or '$(javaparam)', these will be # replaced with, respectively, the name of the function, or the javadoc # '@param' and '@return' stuff. cmt_insert_oc_msg_header = "" # string # Whether a comment should be inserted if a preprocessor is encountered when # stepping backwards from a function name. 
# # Applies to cmt_insert_oc_msg_header, cmt_insert_func_header and # cmt_insert_class_header. cmt_insert_before_preproc = false # true/false # Whether a comment should be inserted if a function is declared inline to a # class definition. # # Applies to cmt_insert_func_header. # # Default: true cmt_insert_before_inlines = true # true/false # Whether a comment should be inserted if the function is a class constructor # or destructor. # # Applies to cmt_insert_func_header. cmt_insert_before_ctor_dtor = false # true/false # # Code modifying options (non-whitespace) # # Add or remove braces on a single-line 'do' statement. mod_full_brace_do = ignore # ignore/add/remove/force # Add or remove braces on a single-line 'for' statement. mod_full_brace_for = ignore # ignore/add/remove/force # (Pawn) Add or remove braces on a single-line function definition. mod_full_brace_function = ignore # ignore/add/remove/force # Add or remove braces on a single-line 'if' statement. Braces will not be # removed if the braced statement contains an 'else'. mod_full_brace_if = ignore # ignore/add/remove/force # Whether to enforce that all blocks of an 'if'/'else if'/'else' chain either # have, or do not have, braces. Overrides mod_full_brace_if. # # 0: Don't override mod_full_brace_if # 1: Add braces to all blocks if any block needs braces and remove braces if # they can be removed from all blocks # 2: Add braces to all blocks if any block already has braces, regardless of # whether it needs them # 3: Add braces to all blocks if any block needs braces and remove braces if # they can be removed from all blocks, except if all blocks have braces # despite none needing them mod_full_brace_if_chain = 0 # unsigned number # Whether to add braces to all blocks of an 'if'/'else if'/'else' chain. # If true, mod_full_brace_if_chain will only remove braces from an 'if' that # does not have an 'else if' or 'else'. 
mod_full_brace_if_chain_only = false # true/false

# Add or remove braces on single-line 'while' statement.
mod_full_brace_while = ignore # ignore/add/remove/force

# Add or remove braces on single-line 'using ()' statement.
mod_full_brace_using = ignore # ignore/add/remove/force

# Don't remove braces around statements that span N newlines.
mod_full_brace_nl = 0 # unsigned number

# Whether to prevent removal of braces from 'if'/'for'/'while'/etc. blocks
# which span multiple lines.
#
# Affects:
# mod_full_brace_for
# mod_full_brace_if
# mod_full_brace_if_chain
# mod_full_brace_if_chain_only
# mod_full_brace_while
# mod_full_brace_using
#
# Does not affect:
# mod_full_brace_do
# mod_full_brace_function
mod_full_brace_nl_block_rem_mlcond = false # true/false

# Add or remove unnecessary parentheses on 'return' statement.
mod_paren_on_return = ignore # ignore/add/remove/force

# Add or remove unnecessary parentheses on 'throw' statement.
mod_paren_on_throw = ignore # ignore/add/remove/force

# (Pawn) Whether to change optional semicolons to real semicolons.
mod_pawn_semicolon = false # true/false

# Whether to fully parenthesize Boolean expressions in 'while' and 'if'
# statement, as in 'if (a && b > c)' => 'if (a && (b > c))'.
mod_full_paren_if_bool = false # true/false

# Whether to fully parenthesize Boolean expressions after '='
# statement, as in 'x = a && b > c;' => 'x = (a && (b > c));'.
mod_full_paren_assign_bool = false # true/false

# Whether to fully parenthesize Boolean expressions in 'return'
# statements, as in 'return a && b > c;' => 'return (a && (b > c));'.
mod_full_paren_return_bool = false # true/false

# Whether to remove superfluous semicolons.
mod_remove_extra_semicolon = false # true/false

# Whether to remove duplicate includes.
mod_remove_duplicate_include = false # true/false

# The following options (mod_XX_closebrace_comment) use a different comment
# style, depending on the setting of the next option.
# false: Use the c comment (default) # true : Use the cpp comment mod_add_force_c_closebrace_comment = false # true/false # If a function body exceeds the specified number of newlines and doesn't have # a comment after the close brace, a comment will be added. mod_add_long_function_closebrace_comment = 0 # unsigned number # If a namespace body exceeds the specified number of newlines and doesn't # have a comment after the close brace, a comment will be added. mod_add_long_namespace_closebrace_comment = 0 # unsigned number # If a class body exceeds the specified number of newlines and doesn't have a # comment after the close brace, a comment will be added. mod_add_long_class_closebrace_comment = 0 # unsigned number # If a switch body exceeds the specified number of newlines and doesn't have a # comment after the close brace, a comment will be added. mod_add_long_switch_closebrace_comment = 0 # unsigned number # If an #ifdef body exceeds the specified number of newlines and doesn't have # a comment after the #endif, a comment will be added. mod_add_long_ifdef_endif_comment = 0 # unsigned number # If an #ifdef or #else body exceeds the specified number of newlines and # doesn't have a comment after the #else, a comment will be added. mod_add_long_ifdef_else_comment = 0 # unsigned number # Whether to take care of the case by the mod_sort_xx options. mod_sort_case_sensitive = false # true/false # Whether to sort consecutive single-line 'import' statements. mod_sort_import = false # true/false # (C#) Whether to sort consecutive single-line 'using' statements. mod_sort_using = false # true/false # Whether to sort consecutive single-line '#include' statements (C/C++) and # '#import' statements (Objective-C). Be aware that this has the potential to # break your code if your includes/imports have ordering dependencies. 
mod_sort_include = false # true/false

# Whether to prioritize '#include' and '#import' statements that contain a
# filename without an extension when sorting is enabled.
mod_sort_incl_import_prioritize_filename = false # true/false

# Whether to prioritize '#include' and '#import' statements that do not
# contain extensions when sorting is enabled.
mod_sort_incl_import_prioritize_extensionless = false # true/false

# Whether to prioritize '#include' and '#import' statements that use angle
# brackets over quotes when sorting is enabled.
mod_sort_incl_import_prioritize_angle_over_quotes = false # true/false

# Whether to ignore file extensions in '#include' and '#import' statements
# for sorting comparison.
mod_sort_incl_import_ignore_extension = false # true/false

# Whether to group '#include' and '#import' statements when sorting is enabled.
mod_sort_incl_import_grouping_enabled = false # true/false

# Whether to move a 'break' that appears after a fully braced 'case' before
# the close brace, as in 'case X: { ... } break;' => 'case X: { ... break; }'.
mod_move_case_break = false # true/false

# Whether to move a 'return' that appears after a fully braced 'case' before
# the close brace, as in 'case X: { ... } return;' => 'case X: { ... return; }'.
mod_move_case_return = false # true/false

# Add or remove braces around a fully braced case statement. Will only remove
# braces if there are no variable declarations in the block.
mod_case_brace = ignore # ignore/add/remove/force

# Whether to remove a void 'return;' that appears as the last statement in a
# function.
mod_remove_empty_return = false # true/false

# Add or remove the comma after the last value of an enumeration.
mod_enum_last_comma = ignore # ignore/add/remove/force

# Syntax to use for infinite loops.
# # 0: Leave syntax alone (default) # 1: Rewrite as `for(;;)` # 2: Rewrite as `while(true)` # 3: Rewrite as `do`...`while(true);` # 4: Rewrite as `while(1)` # 5: Rewrite as `do`...`while(1);` # # Infinite loops that do not already match one of these syntaxes are ignored. # Other options that affect loop formatting will be applied after transforming # the syntax. mod_infinite_loop = 0 # unsigned number # Add or remove the 'int' keyword in 'int short'. mod_int_short = ignore # ignore/add/remove/force # Add or remove the 'int' keyword in 'short int'. mod_short_int = ignore # ignore/add/remove/force # Add or remove the 'int' keyword in 'int long'. mod_int_long = ignore # ignore/add/remove/force # Add or remove the 'int' keyword in 'long int'. mod_long_int = ignore # ignore/add/remove/force # Add or remove the 'int' keyword in 'int signed'. mod_int_signed = ignore # ignore/add/remove/force # Add or remove the 'int' keyword in 'signed int'. mod_signed_int = ignore # ignore/add/remove/force # Add or remove the 'int' keyword in 'int unsigned'. mod_int_unsigned = ignore # ignore/add/remove/force # Add or remove the 'int' keyword in 'unsigned int'. mod_unsigned_int = ignore # ignore/add/remove/force # If there is a situation where mod_int_* and mod_*_int would result in # multiple int keywords, whether to keep the rightmost int (the default) or the # leftmost int. mod_int_prefer_int_on_left = false # true/false # (OC) Whether to organize the properties. If true, properties will be # rearranged according to the mod_sort_oc_property_*_weight factors. mod_sort_oc_properties = false # true/false # (OC) Weight of a class property modifier. mod_sort_oc_property_class_weight = 0 # number # (OC) Weight of 'atomic' and 'nonatomic'. mod_sort_oc_property_thread_safe_weight = 0 # number # (OC) Weight of 'readwrite' when organizing properties. 
mod_sort_oc_property_readwrite_weight = 0 # number # (OC) Weight of a reference type specifier ('retain', 'copy', 'assign', # 'weak', 'strong') when organizing properties. mod_sort_oc_property_reference_weight = 0 # number # (OC) Weight of getter type ('getter=') when organizing properties. mod_sort_oc_property_getter_weight = 0 # number # (OC) Weight of setter type ('setter=') when organizing properties. mod_sort_oc_property_setter_weight = 0 # number # (OC) Weight of nullability type ('nullable', 'nonnull', 'null_unspecified', # 'null_resettable') when organizing properties. mod_sort_oc_property_nullability_weight = 0 # number # # Preprocessor options # # How to use tabs when indenting preprocessor code. # # -1: Use 'indent_with_tabs' setting (default) # 0: Spaces only # 1: Indent with tabs to brace level, align with spaces # 2: Indent and align with tabs, using spaces when not on a tabstop # # Default: -1 pp_indent_with_tabs = -1 # number # Add or remove indentation of preprocessor directives inside #if blocks # at brace level 0 (file-level). pp_indent = ignore # ignore/add/remove/force # Whether to indent #if/#else/#endif at the brace level. If false, these are # indented from column 1. pp_indent_at_level = false # true/false # Whether to indent #if/#else/#endif at the parenthesis level if the brace # level is 0. If false, these are indented from column 1. pp_indent_at_level0 = false # true/false # Specifies the number of columns to indent preprocessors per level # at brace level 0 (file-level). If pp_indent_at_level=false, also specifies # the number of columns to indent preprocessors per level # at brace level > 0 (function-level). # # Default: 1 pp_indent_count = 1 # unsigned number # Add or remove space after # based on pp level of #if blocks. pp_space_after = ignore # ignore/add/remove/force # Sets the number of spaces per level added with pp_space_after. 
pp_space_count = 0 # unsigned number # The indent for '#region' and '#endregion' in C# and '#pragma region' in # C/C++. Negative values decrease indent down to the first column. pp_indent_region = 0 # number # Whether to indent the code between #region and #endregion. pp_region_indent_code = false # true/false # If pp_indent_at_level=true, sets the indent for #if, #else and #endif when # not at file-level. Negative values decrease indent down to the first column. # # =0: Indent preprocessors using output_tab_size # >0: Column at which all preprocessors will be indented pp_indent_if = 0 # number # Whether to indent the code between #if, #else and #endif. pp_if_indent_code = false # true/false # Whether to indent the body of an #if that encompasses all the code in the file. pp_indent_in_guard = false # true/false # Whether to indent '#define' at the brace level. If false, these are # indented from column 1. pp_define_at_level = false # true/false # Whether to indent '#include' at the brace level. pp_include_at_level = false # true/false # Whether to ignore the '#define' body while formatting. pp_ignore_define_body = false # true/false # An offset value that controls the indentation of the body of a multiline #define. # 'body' refers to all the lines of a multiline #define except the first line. # Requires 'pp_ignore_define_body = false'. # # <0: Absolute column: the body indentation starts off at the specified column # (ex. -3 ==> the body is indented starting from column 3) # >=0: Relative to the column of the '#' of '#define' # (ex. 3 ==> the body is indented starting 3 columns at the right of '#') # # Default: 8 pp_multiline_define_body_indent = 8 # number # Whether to indent case statements between #if, #else, and #endif. # Only applies to the indent of the preprocessor that the case statements # directly inside of. # # Default: true pp_indent_case = true # true/false # Whether to indent whole function definitions between #if, #else, and #endif. 
# Only applies to the indent of the preprocessor that the function definition # is directly inside of. # # Default: true pp_indent_func_def = true # true/false # Whether to indent extern C blocks between #if, #else, and #endif. # Only applies to the indent of the preprocessor that the extern block is # directly inside of. # # Default: true pp_indent_extern = true # true/false # How to indent braces directly inside #if, #else, and #endif. # Requires pp_if_indent_code=true and only applies to the indent of the # preprocessor that the braces are directly inside of. # 0: No extra indent # 1: Indent by one level # -1: Preserve original indentation # # Default: 1 pp_indent_brace = 1 # number # Action to perform when unbalanced #if and #else blocks are found. # 0: do nothing # 1: print a warning message # 2: terminate the program with an error (EX_SOFTWARE) # # The action will be triggered in the following cases: # - if an #ifdef block ends on a different indent level than # where it started from. Example: # # #ifdef TEST # int i; # { # int j; # #endif # # - an #elif/#else block ends on a different indent level than # the corresponding #ifdef block. Example: # # #ifdef TEST # int i; # #else # } # int j; # #endif pp_unbalanced_if_action = 0 # unsigned number # # Sort includes options # # The regex for include category with priority 0. include_category_0 = "" # string # The regex for include category with priority 1. include_category_1 = "" # string # The regex for include category with priority 2. include_category_2 = "" # string # # Use or Do not Use options # # true: indent_func_call_param will be used (default) # false: indent_func_call_param will NOT be used # # Default: true use_indent_func_call_param = true # true/false # The value of the indentation for a continuation line is calculated # differently if the statement is: # - a declaration: your case with QString fileName ... # - an assignment: your case with pSettings = new QSettings( ... 
# # At the second case the indentation value might be used twice: # - at the assignment # - at the function call (if present) # # To prevent the double use of the indentation value, use this option with the # value 'true'. # # true: indent_continue will be used only once # false: indent_continue will be used every time (default) # # Requires indent_ignore_first_continue=false. use_indent_continue_only_once = false # true/false # The indentation can be: # - after the assignment, at the '[' character # - at the beginning of the lambda body # # true: indentation will be at the beginning of the lambda body # false: indentation will be after the assignment (default) indent_cpp_lambda_only_once = false # true/false # Whether sp_after_angle takes precedence over sp_inside_fparen. This was the # historic behavior, but is probably not the desired behavior, so this is off # by default. use_sp_after_angle_always = false # true/false # Whether to apply special formatting for Qt SIGNAL/SLOT macros. Essentially, # this tries to format these so that they match Qt's normalized form (i.e. the # result of QMetaObject::normalizedSignature), which can slightly improve the # performance of the QObject::connect call, rather than how they would # otherwise be formatted. # # See options_for_QT.cpp for details. # # Default: true use_options_overriding_for_qt_macros = true # true/false # If true: the form feed character is removed from the list of whitespace # characters. See https://en.cppreference.com/w/cpp/string/byte/isspace. use_form_feed_no_more_as_whitespace_character = false # true/false # # Warn levels - 1: error, 2: warning (default), 3: note # # (C#) Warning is given if doing tab-to-\t replacement and we have found one # in a C# verbatim string literal. # # Default: 2 warn_level_tabs_found_in_verbatim_string_literals = 2 # unsigned number # Limit the number of loops. # Used by uncrustify.cpp to exit from infinite loop. # 0: no limit. 
debug_max_number_of_loops = 0 # number # Set the number of the line to protocol; # Used in the function prot_the_line if the 2. parameter is zero. # 0: nothing protocol. debug_line_number_to_protocol = 0 # number # Set the number of second(s) before terminating formatting the current file, # 0: no timeout. # only for linux debug_timeout = 0 # number # Set the number of characters to be printed if the text is too long, # 0: do not truncate. debug_truncate = 0 # unsigned number # sort (or not) the tracking info. # # Default: true debug_sort_the_tracks = true # true/false # decode (or not) the flags as a new line. # only if the -p option is set. debug_decode_the_flags = false # true/false # use (or not) the exit(EX_SOFTWARE) function. # # Default: true debug_use_the_exit_function_pop = true # true/false # print (or not) the version in the file defined at the command option -o. debug_print_version = false # true/false # insert the number of the line at the beginning of each line set_numbering_for_html_output = false # true/false # Meaning of the settings: # Ignore - do not do any changes # Add - makes sure there is 1 or more space/brace/newline/etc # Force - makes sure there is exactly 1 space/brace/newline/etc, # behaves like Add in some contexts # Remove - removes space/brace/newline/etc # # # - Token(s) can be treated as specific type(s) with the 'set' option: # `set tokenType tokenString [tokenString...]` # # Example: # `set BOOL __AND__ __OR__` # # tokenTypes are defined in src/token_enum.h, use them without the # 'CT_' prefix: 'CT_BOOL' => 'BOOL' # # # - Token(s) can be treated as type(s) with the 'type' option. # `type tokenString [tokenString...]` # # Example: # `type int c_uint_8 Rectangle` # # This can also be achieved with `set TYPE int c_uint_8 Rectangle` # # # To embed whitespace in tokenStrings use the '\' escape character, or quote # the tokenStrings. 
These quotes are supported: "'` # # # - Support for the auto detection of languages through the file ending can be # added using the 'file_ext' command. # `file_ext langType langString [langString..]` # # Example: # `file_ext CPP .ch .cxx .cpp.in` # # langTypes are defined in uncrusify_types.h in the lang_flag_e enum, use # them without the 'LANG_' prefix: 'LANG_CPP' => 'CPP' # # # - Custom macro-based indentation can be set up using 'macro-open', # 'macro-else' and 'macro-close'. # `(macro-open | macro-else | macro-close) tokenString` # # Example: # `macro-open BEGIN_TEMPLATE_MESSAGE_MAP` # `macro-open BEGIN_MESSAGE_MAP` # `macro-close END_MESSAGE_MAP` # # # option(s) with 'not default' value: 0 # ================================================ FILE: inst/notebooks/benchmark_mix_vs_sp.R ================================================ # Benchmark: Multi-panel mixture vs single-panel # # Metrics: # ELBO: mixture ELBO vs best single-panel ELBO (should be >=) # FDR: fraction of 95% CS NOT containing a causal variable # Power: fraction of causal variables covered by at least one 95% CS # # True model: z ~ N(R_mix %*% beta, sigma2 * R_mix + lambda * I) # where R_mix = w1 * R1 + w2 * R2 (true mixture). # # Usage: Rscript inst/notebooks/benchmark_mix_vs_sp.R # Or: source("inst/notebooks/benchmark_mix_vs_sp.R") after devtools::load_all() # Load from the working tree to pick up uncommitted fixes. 
# Prefer the working tree (so uncommitted fixes are exercised); fall back to
# the installed susieR when not run from the package root.
if (requireNamespace("devtools", quietly = TRUE) && file.exists("DESCRIPTION")) {
  devtools::load_all(".", quiet = TRUE)
} else {
  library(susieR)
  message("NOTE: using installed susieR; run from package root for working-tree version")
}

# ---------------------------------------------------------------------------
# Generate X with block-correlated LD structure
# ---------------------------------------------------------------------------
# n          : number of rows (samples) to simulate.
# p          : number of columns (variables).
# rho        : within-block correlation induced by mixing in a shared factor.
# block_size : number of adjacent columns per correlated block; any trailing
#              columns (when p %% block_size != 0) are left uncorrelated,
#              since only p %/% block_size full blocks are processed.
# Returns an n x p numeric matrix.
make_block_correlated_X <- function(n, p, rho, block_size = 10) {
  X <- matrix(rnorm(n * p), n, p)
  n_blocks <- p %/% block_size
  for (b in seq_len(n_blocks)) {
    idx <- ((b - 1) * block_size + 1):(b * block_size)
    shared <- rnorm(n)
    # Convex mix of independent noise and a shared factor: variance stays 1
    # and the within-block correlation is rho.
    X[, idx] <- sqrt(1 - rho) * X[, idx] + sqrt(rho) * shared
  }
  X
}

# ---------------------------------------------------------------------------
# CS-based FDR/Power
# FDR = fraction of 95% CS that do NOT contain any causal variable
# Power = fraction of causal variables covered by at least one 95% CS
# ---------------------------------------------------------------------------
# fit        : a susie fit whose $sets$cs holds the credible sets as a list
#              of variable-index vectors.
# causal_idx : indices of the true causal variables.
# Returns list(fdr, power, n_cs). When the fit reports no credible sets,
# fdr and power are both defined as 0 (no false discoveries, nothing covered).
cs_fdr_power <- function(fit, causal_idx) {
  cs_list <- fit$sets$cs
  if (is.null(cs_list) || length(cs_list) == 0)
    return(list(fdr = 0, power = 0, n_cs = 0))
  n_cs <- length(cs_list)
  # A CS is a "hit" if it contains at least one causal variable.
  cs_hits <- sapply(cs_list, function(cs) any(cs %in% causal_idx))
  fdr <- sum(!cs_hits) / n_cs
  # A causal variable is "covered" if at least one CS contains it.
  covered <- sapply(causal_idx, function(j) any(sapply(cs_list, function(cs) j %in% cs)))
  power <- mean(covered)
  list(fdr = fdr, power = power, n_cs = n_cs)
}

# ---------------------------------------------------------------------------
# Single scenario runner
# ---------------------------------------------------------------------------
# scenario : list describing one simulation setting; fields read below include
#            name, p, true_w, B1, B2, rho1, rho2, n_signals, signal_strength,
#            lambda, max_iter, L and seed_base.
# n_reps   : number of simulation replicates.
run_scenario <- function(scenario, n_reps = 50) {
  cat(sprintf("=== %s (p=%d, tw=%.1f/%.1f, B=%d/%d, rho=%.1f/%.1f, L=%d, sig=%.1f) ===\n",
              scenario$name, scenario$p, scenario$true_w[1], scenario$true_w[2],
              scenario$B1, scenario$B2, scenario$rho1, scenario$rho2,
              scenario$n_signals, scenario$signal_strength))
  p <- scenario$p
  n_signals <-
scenario$n_signals signal_strength <- scenario$signal_strength lambda <- scenario$lambda max_iter <- scenario$max_iter L <- scenario$L # Accumulators mix_ge_sp <- 0 mix_better <- 0 safeguard_ct <- 0 elbo_diffs <- numeric(n_reps) omega1_est <- numeric(n_reps) # Track per-iteration ELBO decreases in mixture fits elbo_decrease_ct <- 0 # reps with at least one ELBO decrease # CS-based FDR/power: rows = reps, cols = methods methods <- c("sp1", "sp2", "best_sp", "mix") fdr_mat <- matrix(NA, n_reps, 4, dimnames = list(NULL, methods)) power_mat <- matrix(NA, n_reps, 4, dimnames = list(NULL, methods)) ncs_mat <- matrix(NA, n_reps, 4, dimnames = list(NULL, methods)) for (rep in seq_len(n_reps)) { set.seed(scenario$seed_base + rep) X1 <- make_block_correlated_X(scenario$B1, p, scenario$rho1) X2 <- make_block_correlated_X(scenario$B2, p, scenario$rho2) R1 <- crossprod(X1) / scenario$B1 R2 <- crossprod(X2) / scenario$B2 R_true <- scenario$true_w[1] * R1 + scenario$true_w[2] * R2 beta <- rep(0, p) causal <- sample(p, n_signals) beta[causal] <- signal_strength * sample(c(-1, 1), n_signals, replace = TRUE) z <- as.vector(R_true %*% beta) + rnorm(p, sd = sqrt(lambda)) # Single-panel fits fit1 <- susie_rss(z = z, X = X1, L = L, max_iter = max_iter, estimate_residual_variance = TRUE, verbose = FALSE) fit2 <- susie_rss(z = z, X = X2, L = L, max_iter = max_iter, estimate_residual_variance = TRUE, verbose = FALSE) best_sp_elbo <- max(tail(fit1$elbo, 1), tail(fit2$elbo, 1)) best_sp_fit <- if (tail(fit1$elbo, 1) >= tail(fit2$elbo, 1)) fit1 else fit2 # Mixture fit (with all fixes + safeguard) fit_mix <- susie_rss(z = z, X = list(X1, X2), L = L, max_iter = max_iter, estimate_residual_variance = TRUE, verbose = FALSE, check_prior = FALSE) mix_elbo <- tail(fit_mix$elbo, 1) # ELBO tracking elbo_diffs[rep] <- mix_elbo - best_sp_elbo omega1_est[rep] <- fit_mix$omega_weights[1] if (mix_elbo >= best_sp_elbo - 1e-6) mix_ge_sp <- mix_ge_sp + 1 if (mix_elbo > best_sp_elbo + 0.1) mix_better <- 
mix_better + 1 if (any(fit_mix$omega_weights > 0.999)) safeguard_ct <- safeguard_ct + 1 # omega collapsed to single panel # Check for ELBO decreases within the mixture fit elbo_traj <- fit_mix$elbo if (length(elbo_traj) > 1 && any(diff(elbo_traj) < -1e-6)) elbo_decrease_ct <- elbo_decrease_ct + 1 # CS-based FDR / Power r1 <- cs_fdr_power(fit1, causal) r2 <- cs_fdr_power(fit2, causal) r_best <- cs_fdr_power(best_sp_fit, causal) r_mix <- cs_fdr_power(fit_mix, causal) fdr_mat[rep, ] <- c(r1$fdr, r2$fdr, r_best$fdr, r_mix$fdr) power_mat[rep, ] <- c(r1$power, r2$power, r_best$power, r_mix$power) ncs_mat[rep, ] <- c(r1$n_cs, r2$n_cs, r_best$n_cs, r_mix$n_cs) # Print detail for first 2 reps if (rep <= 2) { cat(sprintf(" Rep %d: SP1=%.1f SP2=%.1f | MIX=%.1f (w=%.2f,%.2f)\n", rep, tail(fit1$elbo, 1), tail(fit2$elbo, 1), mix_elbo, fit_mix$omega_weights[1], fit_mix$omega_weights[2])) cat(sprintf(" MIX: %d CS, FDR=%.2f, Power=%.2f | bestSP: %d CS, FDR=%.2f, Power=%.2f\n", r_mix$n_cs, r_mix$fdr, r_mix$power, r_best$n_cs, r_best$fdr, r_best$power)) cat(sprintf(" ELBO trajectory: %s\n", paste(round(head(fit_mix$elbo, 8), 1), collapse = " -> "))) } } # Per-scenario summary cat(sprintf(" ELBO: Mix>=SP %d/%d | Better %d/%d | Collapsed %d/%d | ELBO-decrease %d/%d\n", mix_ge_sp, n_reps, mix_better, n_reps, safeguard_ct, n_reps, elbo_decrease_ct, n_reps)) cat(sprintf(" diff: mean=%.2f min=%.2f max=%.2f\n", mean(elbo_diffs), min(elbo_diffs), max(elbo_diffs))) cat(sprintf(" CS-FDR: SP1=%.3f SP2=%.3f bestSP=%.3f MIX=%.3f\n", mean(fdr_mat[,"sp1"]), mean(fdr_mat[,"sp2"]), mean(fdr_mat[,"best_sp"]), mean(fdr_mat[,"mix"]))) cat(sprintf(" CS-Power: SP1=%.3f SP2=%.3f bestSP=%.3f MIX=%.3f\n", mean(power_mat[,"sp1"]), mean(power_mat[,"sp2"]), mean(power_mat[,"best_sp"]), mean(power_mat[,"mix"]))) cat(sprintf(" Avg #CS: SP1=%.1f SP2=%.1f bestSP=%.1f MIX=%.1f\n", mean(ncs_mat[,"sp1"]), mean(ncs_mat[,"sp2"]), mean(ncs_mat[,"best_sp"]), mean(ncs_mat[,"mix"]))) if (all(scenario$true_w > 0)) 
cat(sprintf(" True w1=%.1f, est w1: mean=%.2f sd=%.2f\n", scenario$true_w[1], mean(omega1_est), sd(omega1_est))) cat("\n") invisible(list( name = scenario$name, mix_ge_sp = mix_ge_sp, mix_better = mix_better, safeguard_ct = safeguard_ct, elbo_decrease_ct = elbo_decrease_ct, elbo_diffs = elbo_diffs, omega1_est = omega1_est, n_reps = n_reps, fdr_mat = fdr_mat, power_mat = power_mat, ncs_mat = ncs_mat )) } # --------------------------------------------------------------------------- # Scenario definitions # --------------------------------------------------------------------------- scenarios <- list( # --- Stress tests (larger p, stronger signals, more LD structure) --- list(name = "equal_mix", p = 200, B1 = 500, B2 = 500, rho1 = 0.7, rho2 = 0.3, true_w = c(0.5, 0.5), n_signals = 5, signal_strength = 3.0, lambda = 0.1, max_iter = 100, L = 10, seed_base = 10000), list(name = "asym_weight", p = 200, B1 = 500, B2 = 500, rho1 = 0.7, rho2 = 0.3, true_w = c(0.3, 0.7), n_signals = 5, signal_strength = 3.0, lambda = 0.1, max_iter = 100, L = 10, seed_base = 20000), list(name = "asym_B", p = 200, B1 = 200, B2 = 800, rho1 = 0.7, rho2 = 0.3, true_w = c(0.5, 0.5), n_signals = 5, signal_strength = 3.0, lambda = 0.1, max_iter = 100, L = 10, seed_base = 30000), list(name = "strong_dense", p = 200, B1 = 500, B2 = 500, rho1 = 0.7, rho2 = 0.3, true_w = c(0.5, 0.5), n_signals = 8, signal_strength = 5.0, lambda = 0.1, max_iter = 100, L = 10, seed_base = 40000), list(name = "one_correct", p = 200, B1 = 500, B2 = 500, rho1 = 0.7, rho2 = 0.3, true_w = c(1.0, 0.0), n_signals = 5, signal_strength = 3.0, lambda = 0.1, max_iter = 100, L = 10, seed_base = 50000), list(name = "extreme_LD", p = 200, B1 = 500, B2 = 500, rho1 = 0.9, rho2 = 0.1, true_w = c(0.5, 0.5), n_signals = 5, signal_strength = 3.0, lambda = 0.1, max_iter = 100, L = 10, seed_base = 60000), list(name = "small_B", p = 200, B1 = 150, B2 = 150, rho1 = 0.7, rho2 = 0.3, true_w = c(0.5, 0.5), n_signals = 5, signal_strength = 3.0, lambda 
= 0.1, max_iter = 100, L = 10, seed_base = 70000), list(name = "weak_signals", p = 200, B1 = 500, B2 = 500, rho1 = 0.7, rho2 = 0.3, true_w = c(0.5, 0.5), n_signals = 5, signal_strength = 1.5, lambda = 0.1, max_iter = 100, L = 10, seed_base = 80000), # --- Smaller-scale sanity checks (from earlier benchmark) --- list(name = "small_equal", p = 50, B1 = 200, B2 = 200, rho1 = 0.5, rho2 = 0.3, true_w = c(0.5, 0.5), n_signals = 3, signal_strength = 2.0, lambda = 0.1, max_iter = 100, L = 10, seed_base = 90000), list(name = "small_asym_w", p = 50, B1 = 200, B2 = 200, rho1 = 0.5, rho2 = 0.3, true_w = c(0.3, 0.7), n_signals = 3, signal_strength = 2.0, lambda = 0.1, max_iter = 100, L = 10, seed_base = 100000), list(name = "small_asym_B", p = 50, B1 = 100, B2 = 400, rho1 = 0.5, rho2 = 0.3, true_w = c(0.5, 0.5), n_signals = 3, signal_strength = 2.0, lambda = 0.1, max_iter = 100, L = 10, seed_base = 110000), list(name = "small_one_true", p = 50, B1 = 200, B2 = 200, rho1 = 0.5, rho2 = 0.3, true_w = c(1.0, 0.0), n_signals = 3, signal_strength = 2.0, lambda = 0.1, max_iter = 100, L = 10, seed_base = 120000) ) # --------------------------------------------------------------------------- # Run all scenarios # --------------------------------------------------------------------------- n_reps <- 50 cat("================================================================\n") cat("Benchmark: Multi-Panel Mixture vs Single Panel\n") cat(sprintf(" %d scenarios x %d reps = %d total runs\n", length(scenarios), n_reps, length(scenarios) * n_reps)) cat(" FDR/Power based on 95%% credible sets\n") cat("================================================================\n\n") results <- lapply(scenarios, run_scenario, n_reps = n_reps) # --------------------------------------------------------------------------- # ELBO summary table # --------------------------------------------------------------------------- cat("================================================================\n") cat("ELBO TABLE\n") 
cat("================================================================\n\n")

## ELBO table: one row per scenario, then an overall pass/decrease count.
cat(sprintf("%-18s %4s %8s %8s %9s %9s %10s %10s\n",
            "Scenario", "N", "Mix>=SP", "Better", "Safegrd", "ELBOdecr",
            "diff_mean", "diff_min"))
cat(strrep("-", 90), "\n")
for (res in results) {
  cat(sprintf("%-18s %4d %5d/%-2d %5d/%-2d %5d/%-2d %6d/%-2d %10.2f %10.2f\n",
              res$name, res$n_reps,
              res$mix_ge_sp, res$n_reps,
              res$mix_better, res$n_reps,
              res$safeguard_ct, res$n_reps,
              res$elbo_decrease_ct, res$n_reps,
              mean(res$elbo_diffs), min(res$elbo_diffs)))
}

## Totals across every scenario.
total_reps <- sum(vapply(results, function(x) x$n_reps, numeric(1)))
total_pass <- sum(vapply(results, function(x) x$mix_ge_sp, numeric(1)))
total_decr <- sum(vapply(results, function(x) x$elbo_decrease_ct, numeric(1)))
cat(sprintf("\nOVERALL: %d/%d mixture >= SP | %d/%d had ELBO decrease\n",
            total_pass, total_reps, total_decr, total_reps))

# ---------------------------------------------------------------------------
# FDR table (95% CS)
# ---------------------------------------------------------------------------
cat("\n\n================================================================\n")
cat("FDR TABLE (95% Credible Sets)\n")
cat(" FDR = fraction of CS not containing any causal variable\n")
cat("================================================================\n\n")
cat(sprintf("%-18s %8s %8s %8s %8s\n", "Scenario", "SP1", "SP2", "bestSP", "MIX"))
cat(strrep("-", 52), "\n")
for (res in results) {
  cat(sprintf("%-18s %8.3f %8.3f %8.3f %8.3f\n",
              res$name,
              mean(res$fdr_mat[, "sp1"]),
              mean(res$fdr_mat[, "sp2"]),
              mean(res$fdr_mat[, "best_sp"]),
              mean(res$fdr_mat[, "mix"])))
}

# ---------------------------------------------------------------------------
# Power table (95% CS)
# ---------------------------------------------------------------------------
cat("\n\n================================================================\n")
cat("POWER TABLE (95% Credible Sets)\n")
cat(" Power = fraction of causal vars covered by >= 1 CS\n")
cat("================================================================\n\n")
cat(sprintf("%-18s %8s %8s %8s %8s\n", "Scenario", "SP1", "SP2", "bestSP", "MIX")) cat(paste(rep("-", 52), collapse = ""), "\n") for (r in results) { cat(sprintf("%-18s %8.3f %8.3f %8.3f %8.3f\n", r$name, mean(r$power_mat[,"sp1"]), mean(r$power_mat[,"sp2"]), mean(r$power_mat[,"best_sp"]), mean(r$power_mat[,"mix"]))) } # --------------------------------------------------------------------------- # Average number of CS # --------------------------------------------------------------------------- cat("\n\n================================================================\n") cat("AVG NUMBER OF CS\n") cat("================================================================\n\n") cat(sprintf("%-18s %8s %8s %8s %8s\n", "Scenario", "SP1", "SP2", "bestSP", "MIX")) cat(paste(rep("-", 52), collapse = ""), "\n") for (r in results) { cat(sprintf("%-18s %8.1f %8.1f %8.1f %8.1f\n", r$name, mean(r$ncs_mat[,"sp1"]), mean(r$ncs_mat[,"sp2"]), mean(r$ncs_mat[,"best_sp"]), mean(r$ncs_mat[,"mix"]))) } ================================================ FILE: inst/notebooks/small_sample_benchmark.ipynb ================================================ { "cells": [ { "cell_type": "markdown", "id": "1a065c06", "metadata": {}, "source": [ "# Small-Sample Benchmark SuSiE vs SuSiE-SS\n", "\n", "We observe in our data analysis that when sample sizes are small\n", "relative to the number of variants ($n \\ll p$),\n", "standard SuSiE can **overfit** by underestimating the residual variance $\\sigma^2$.\n", "This leads to inflated Bayes factors and spurious credible sets (CS).\n", "The Servin-Stephens prior integrates out $\\sigma^2$ analytically using a\n", "Normal-Inverse-Gamma (NIG) conjugate prior, producing $t$-distributed marginals\n", "that are naturally more conservative but calibrated in scenarios including and beyond small samples.\n", "\n", "In this notebook we show a benchmark focused on the small sample situation, using realistic simulations from\n", "eQTL data we analyze.\n", "\n", "### 
Data\n", "\n", "This particular example use real genotype and expression data from the Thyroid FMO2 locus,\n", "part of the GTEx project. The dataset contains $n = 574$ samples,\n", "$p = 7{,}651$ variants in a 1 Mb window, and 68 covariates\n", "(5 genotype PCs, 60 inferred covariates, PCR method, platform, and sex).\n", "We first regress covariates out of both $X$ and $y$ on the full cohort,\n", "then subsample $N \\in \\{30, 50, 70, 100\\}$ individuals per replicate.\n", "\n", "### Simulation design\n", "\n", "To create realistic noise that reproduces the overfitting\n", "pattern seen on real data, we:\n", "\n", "1. Fit **LASSO** (with `lambda.1se` from cross-validation) on the subsampled $(X, y)$\n", " to obtain an empirical residual $r = y - X\\hat{\\beta}_{\\text{lasso}}$.\n", " LASSO is agnostic of SuSiE vs SuSiE-SS and is a sparse regression method,\n", " so it may best approximate the residual variances left that might be similar\n", " to what SuSiE and SuSiE-SS will encounter.\n", "2. Compute $w = U^{\\top} r$, where $U$ contains the left singular vectors\n", " of the centered genotype matrix, so each component $w_k$ captures an\n", " independent direction of variance along the $k$-th principal axis of $X$.\n", " This tells us how the residual is distributed across the directions that the\n", " genotype matrix can explain. We expect this projection to be meaningful\n", " because the overfitting problem arises precisely because real residual noise\n", " concentrates its variance along these same principal axes, making it look\n", " like genetic signal to the model.\n", "3. Using a wild bootstrap approach, we draw $s_k \\in \\lbrace -1, +1 \\rbrace$\n", " independently for each component and form new noise\n", " $\\tilde{r} = U(w \\odot s)$. 
This random sign flip will break any\n", " association between the noise term and any columns in $X$ but will retain\n", " the same per-eigencomponent variance profile because\n", " $w_k^2 = (\\pm w_k)^2$ is unchanged due to sign flip, thus retaining\n", " the realistic residual variance structure in the original data.\n", "4. The sign-flip noise is rescaled to a target standard deviation calibrated\n", " from the full Z-adjusted cohort. We regress $y$ on the top 20 PCs of $X$\n", " (on all 574 samples after covariate adjustment) and set\n", " `noise_scale = sqrt(1 - R2)`. This captures the fraction of phenotypic\n", " variance not explained by genotype and avoids overfitting that would occur\n", " if calibration were done on the small subsample.\n", "5. Simulate causal signals by randomly drawing columns of $X$ with effect\n", " sizes calibrated to a target signal-to-noise ratio `h2_sparse`.\n", "\n", "### Metrics\n", "\n", "| Metric | Definition |\n", "|--------|------------|\n", "| **Power** | (distinct causal variants found in any filtered CS) / (total causal) |\n", "| **Coverage** | (filtered CS containing $\\geq 1$ causal) / (total filtered CS) |\n", "| **CS size** | mean number of variants per filtered CS |\n", "| **CS / rep** | total filtered CS / number of replicates |\n", "| $\\hat{\\sigma}^2$ | estimated residual variance (overfitting diagnostic) |\n", "| $\\sum V$ | sum of estimated prior variances across $L$ effects |\n", "\n", "### References\n", "\n", "- Servin, B. & Stephens, M. (2007). *PLoS Genetics*, 3(7): e114.\n", "- Denault et al (2025). *bioRxiv* doi:10.1101/2025.05.16.654543." 
] }, { "cell_type": "code", "execution_count": null, "id": "59f64421", "metadata": { "execution": { "iopub.execute_input": "2026-02-26T01:50:34.101933Z", "iopub.status.busy": "2026-02-26T01:50:34.100590Z", "iopub.status.idle": "2026-02-26T01:50:35.365493Z", "shell.execute_reply": "2026-02-26T01:50:35.364895Z" } }, "outputs": [], "source": [ "library(susieR)\n", "library(glmnet)\n", "library(digest)\n", "library(future)\n", "library(future.apply)\n", "\n", "# --- Configuration ---\n", "ncores <- max(1, parallelly::availableCores() - 2)\n", "n_rep <- 200 # replicates per setting\n", "L <- 10\n", "N_vals <- c(30, 50, 70, 100)\n", "h2_sparse <- c(0.25, 0.50, 0.75)\n", "L_causal <- c(1, 2, 3, 4, 5)\n", "\n", "# Use multisession (PSOCK) to avoid fork + BLAS crashes\n", "plan(multisession, workers = ncores)\n", "\n", "cat(sprintf(\"susieR version : %s\\n\", packageVersion(\"susieR\")))\n", "cat(sprintf(\"Workers : %d (multisession / PSOCK)\\n\", ncores))\n", "cat(sprintf(\"N values : %s\\n\", paste(N_vals, collapse = \", \")))\n", "cat(sprintf(\"h2_sparse : %s\\n\", paste(h2_sparse, collapse = \", \")))\n", "cat(sprintf(\"n_causal : %s\\n\", paste(L_causal, collapse = \", \")))\n", "cat(sprintf(\"Settings : %d\\n\", length(N_vals) * length(h2_sparse) * length(L_causal)))\n", "cat(sprintf(\"Total reps : %d\\n\",\n", " length(N_vals) * length(h2_sparse) * length(L_causal) * n_rep))" ] }, { "cell_type": "code", "execution_count": 2, "id": "f545a794", "metadata": { "execution": { "iopub.execute_input": "2026-02-26T01:50:35.376293Z", "iopub.status.busy": "2026-02-26T01:50:35.366673Z", "iopub.status.idle": "2026-02-26T01:50:35.688546Z", "shell.execute_reply": "2026-02-26T01:50:35.687791Z" } }, "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ "Raw data: n = 574, p = 7651, ncov = 68\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "var(y_raw) = 0.9827\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "\n", "After Z adjustment (full 
cohort, n = 574):\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ " var(y_raw) = 0.9827\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ " var(y_adj) = 0.3317\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ " R2(y ~ Z) = 0.6625\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ " n = 574, p = 7651\n" ] } ], "source": [ "# --- Load Thyroid FMO2 data ---\n", "dat <- readRDS(\"Thyroid.FMO2.1Mb.RDS\")\n", "X_raw <- dat$X # 574 x 7651 integer genotype (0/1/2)\n", "y_raw <- dat$y # 574 normalized expression\n", "Z <- dat$Z # 574 x 68 covariates\n", "\n", "cat(sprintf(\"Raw data: n = %d, p = %d, ncov = %d\\n\",\n", " nrow(X_raw), ncol(X_raw), ncol(Z)))\n", "cat(sprintf(\"var(y_raw) = %.4f\\n\", var(y_raw)))\n", "\n", "# --- Full-cohort covariate adjustment ---\n", "# Regress Z out of both y and X via hat matrix H = Z1 (Z1'Z1)^{-1} Z1'\n", "# where Z1 = [1, Z] includes an intercept\n", "Z1 <- cbind(1, Z)\n", "H <- Z1 %*% solve(crossprod(Z1), t(Z1))\n", "\n", "y_full <- as.vector(y_raw - H %*% y_raw)\n", "X_full <- X_raw - H %*% X_raw\n", "\n", "# Summary\n", "R2_Z <- 1 - var(y_full) / var(y_raw)\n", "cat(sprintf(\"\\nAfter Z adjustment (full cohort, n = %d):\\n\", length(y_full)))\n", "cat(sprintf(\" var(y_raw) = %.4f\\n\", var(y_raw)))\n", "cat(sprintf(\" var(y_adj) = %.4f\\n\", var(y_full)))\n", "cat(sprintf(\" R2(y ~ Z) = %.4f\\n\", R2_Z))\n", "cat(sprintf(\" n = %d, p = %d\\n\", nrow(X_full), ncol(X_full)))" ] }, { "cell_type": "markdown", "id": "d812bf07", "metadata": {}, "source": [ "## Sign-flip noise model\n", "\n", "The sign-flip (wild bootstrap) procedure generates realistic null noise that preserves the variance structure of LASSO residuals projected onto the principal axes of $X$, while breaking any true genotype-phenotype association. The noise level is calibrated once on the full Z-adjusted cohort using a top-20 PC regression, then applied consistently across all subsample sizes." 
] }, { "cell_type": "code", "execution_count": null, "id": "184807a2", "metadata": { "execution": { "iopub.execute_input": "2026-02-26T01:50:35.691099Z", "iopub.status.busy": "2026-02-26T01:50:35.690502Z", "iopub.status.idle": "2026-02-26T01:50:36.356752Z", "shell.execute_reply": "2026-02-26T01:50:36.355984Z" } }, "outputs": [], "source": [ "# --- Noise calibration on full Z-adjusted data ---\n", "Xs_cal <- scale(X_full, center = TRUE, scale = FALSE)\n", "svd_cal <- svd(Xs_cal, nu = min(20, nrow(X_full)), nv = 0)\n", "PC20 <- svd_cal$u[, 1:min(20, nrow(X_full))]\n", "R2_20 <- summary(lm(y_full ~ PC20))$r.squared\n", "noise_scale_factor <- sqrt(1 - R2_20)\n", "\n", "cat(sprintf(\"Noise calibration (top-20 PC regression on full Z-adjusted data):\\n\"))\n", "cat(sprintf(\" n = %d (full cohort after Z adjustment)\\n\", nrow(X_full)))\n", "cat(sprintf(\" R2(20 PCs) = %.4f -> noise_scale = sqrt(1 - R2) = %.4f\\n\",\n", " R2_20, noise_scale_factor))\n", "cat(sprintf(\" For a subsample with sd(y) = s, noise_sd = s * %.4f\\n\",\n", " noise_scale_factor))\n", "\n", "# ============================================================\n", "# Seed management\n", "# ============================================================\n", "# Each random operation uses a deterministic seed derived from the\n", "# simulation coordinates (rep_id, N, h2, n_causal). This ensures:\n", "#\n", "# 1. Reproducibility \u2014 rerunning the same rep_id always yields\n", "# identical results.\n", "# 2. No collisions \u2014 different (rep, setting) pairs get different\n", "# seeds because each \"purpose\" uses a different set of prime\n", "# multipliers.\n", "# 3. 
Safe extension \u2014 adding reps 11-200 to an existing 1-10 run\n", "# produces genuinely new draws (different rep_ids -> different seeds).\n", "# The checkpoint system (below) tracks completed rep_ids and never\n", "# reruns them, preventing accidental duplication.\n", "\n", "make_seed <- function(rep_i, N,\n", " purpose = c(\"subsample\", \"flip\", \"causal\"),\n", " h2 = 0, nc = 0) {\n", " purpose <- match.arg(purpose)\n", " base <- switch(purpose,\n", " subsample = rep_i * 7919L + N,\n", " flip = rep_i * 1009L + N * 17L + nc * 101L + round(h2 * 1000),\n", " causal = rep_i * 3331L + N * 23L + nc * 107L + round(h2 * 1000)\n", " )\n", " as.integer(abs(base) %% (.Machine$integer.max - 1L) + 1L)\n", "}\n", "\n", "# ============================================================\n", "# Checkpoint utilities\n", "# ============================================================\n", "# The checkpoint system uses an MD5 hash of all simulation parameters\n", "# (data fingerprint + design settings) to detect configuration changes.\n", "# Results are stored per-setting as individual .rds files in outdir.\n", "#\n", "# Workflow:\n", "# 1. compute_config_md5() \u2014 hash all parameters\n", "# 2. checkpoint_init() \u2014 verify existing results or clear\n", "# 3. checkpoint_completed_reps() \u2014 which rep_ids are done?\n", "# 4. checkpoint_save() \u2014 merge new results, deduplicate\n", "# 5. 
checkpoint_save_meta() \u2014 write _meta.rds after completion\n", "\n", "#' Compute MD5 signature of all simulation parameters.\n", "#' Any change in data, design, or noise calibration produces a\n", "#' different hash, triggering automatic invalidation.\n", "compute_config_md5 <- function(X, y, N_vals, h2_sparse, L_causal,\n", " L, noise_scale) {\n", " nr <- min(50, nrow(X)); nc_dim <- min(50, ncol(X))\n", " config <- list(\n", " data_nrow = nrow(X),\n", " data_ncol = ncol(X),\n", " data_corner = sum(X[1:nr, 1:nc_dim]),\n", " var_y = round(var(as.vector(y)), 8),\n", " noise_scale = round(noise_scale, 8),\n", " L = as.integer(L),\n", " N_vals = sort(as.integer(N_vals)),\n", " h2_sparse = sort(round(h2_sparse, 6)),\n", " L_causal = sort(as.integer(L_causal))\n", " )\n", " md5 <- digest(config, algo = \"md5\")\n", " list(config = config, md5 = md5)\n", "}\n", "\n", "#' Initialize checkpoint directory.\n", "#' Returns list(status, meta) where status is \"match\" or \"fresh\".\n", "#' On mismatch, all existing .rds files are deleted.\n", "checkpoint_init <- function(outdir, config_sig) {\n", " dir.create(outdir, showWarnings = FALSE, recursive = TRUE)\n", " meta_path <- file.path(outdir, \"_meta.rds\")\n", "\n", " if (file.exists(meta_path)) {\n", " old_meta <- tryCatch(readRDS(meta_path), error = function(e) NULL)\n", " if (!is.null(old_meta) && !is.null(old_meta$md5) &&\n", " identical(old_meta$md5, config_sig$md5)) {\n", " cat(sprintf(\"Config MD5 verified: %s\\n\", config_sig$md5))\n", " cat(sprintf(\" Previous run: n_rep=%d, timestamp=%s\\n\",\n", " old_meta$n_rep, old_meta$timestamp))\n", " return(list(status = \"match\", meta = old_meta))\n", " }\n", " old_md5 <- if (!is.null(old_meta$md5)) old_meta$md5 else \"(missing/corrupt)\"\n", " cat(sprintf(\"Config MD5 MISMATCH \u2014 clearing old results.\\n\"))\n", " cat(sprintf(\" Old: %s\\n New: %s\\n\", old_md5, config_sig$md5))\n", " old_files <- list.files(outdir, pattern = \"[.]rds$\", full.names = TRUE)\n", " 
if (length(old_files) > 0) {\n", " file.remove(old_files)\n", " cat(sprintf(\" Removed %d old file(s).\\n\", length(old_files)))\n", " }\n", " return(list(status = \"fresh\", meta = NULL))\n", " }\n", "\n", " cat(sprintf(\"No existing checkpoint. Config MD5: %s\\n\", config_sig$md5))\n", " list(status = \"fresh\", meta = NULL)\n", "}\n", "\n", "#' Get sorted vector of completed rep_ids for one setting tag.\n", "checkpoint_completed_reps <- function(outdir, tag) {\n", " path <- file.path(outdir, paste0(tag, \".rds\"))\n", " if (!file.exists(path)) return(integer(0))\n", " tryCatch({\n", " x <- readRDS(path)\n", " if (is.data.frame(x) && \"rep\" %in% names(x) && nrow(x) > 0)\n", " sort(unique(as.integer(x$rep)))\n", " else\n", " integer(0)\n", " }, error = function(e) integer(0))\n", "}\n", "\n", "#' Load checkpoint data for one setting (NULL if absent/corrupt).\n", "checkpoint_load <- function(outdir, tag) {\n", " path <- file.path(outdir, paste0(tag, \".rds\"))\n", " if (!file.exists(path)) return(NULL)\n", " tryCatch({\n", " x <- readRDS(path)\n", " if (is.data.frame(x) && nrow(x) > 0 && \"rep\" %in% names(x)) x\n", " else NULL\n", " }, error = function(e) NULL)\n", "}\n", "\n", "#' Save new results, merging with existing and deduplicating by rep_id.\n", "#' Returns the combined data.frame (invisibly).\n", "checkpoint_save <- function(outdir, tag, new_data) {\n", " path <- file.path(outdir, paste0(tag, \".rds\"))\n", " existing <- checkpoint_load(outdir, tag)\n", " if (!is.null(existing)) {\n", " # Safety: remove any pre-existing rows for rep_ids we're about to add\n", " overlap <- existing$rep %in% new_data$rep\n", " if (any(overlap)) {\n", " n_dup <- length(unique(existing$rep[overlap]))\n", " warning(sprintf(\"%s: deduplicating %d overlapping rep_id(s)\", tag, n_dup))\n", " existing <- existing[!overlap, ]\n", " }\n", " combined <- rbind(existing, new_data)\n", " } else {\n", " combined <- new_data\n", " }\n", " saveRDS(combined, path)\n", " 
invisible(combined)\n", "}\n", "\n", "#' Write checkpoint metadata after successful completion.\n", "checkpoint_save_meta <- function(outdir, config_sig, n_rep) {\n", " saveRDS(list(\n", " config = config_sig$config,\n", " md5 = config_sig$md5,\n", " n_rep = n_rep,\n", " timestamp = Sys.time()\n", " ), file.path(outdir, \"_meta.rds\"))\n", "}\n", "\n", "# ============================================================\n", "# Simulation functions\n", "# ============================================================\n", "\n", "get_lasso_residual <- function(X, y, seed = 42) {\n", " set.seed(seed)\n", " n <- nrow(X)\n", " cv_fit <- cv.glmnet(X, y, alpha = 1, nfolds = min(10, n))\n", " lasso_fit <- glmnet(X, y, alpha = 1, lambda = cv_fit$lambda.1se)\n", " as.vector(y - predict(lasso_fit, X))\n", "}\n", "\n", "gen_signflip_noise <- function(U, resid, target_sd, seed = 1) {\n", " set.seed(seed)\n", " r_centered <- resid - mean(resid)\n", " proj <- as.vector(crossprod(U, r_centered))\n", " k <- length(proj)\n", " signs <- sample(c(-1, 1), k, replace = TRUE)\n", " noise <- as.vector(U[, 1:k] %*% (proj * signs))\n", " noise * target_sd / sd(noise)\n", "}\n", "\n", "run_one_rep <- function(rep_i, n_causal, h2_sp, X, y_real,\n", " U_pre = NULL, resid_pre = NULL, L = 10,\n", " noise_scale = noise_scale_factor) {\n", " suppressWarnings({\n", " n <- nrow(X); p <- ncol(X)\n", "\n", " if (!is.null(U_pre) && !is.null(resid_pre)) {\n", " U <- U_pre\n", " resid <- resid_pre\n", " } else {\n", " seed_sub <- make_seed(rep_i, n, \"subsample\")\n", " resid <- get_lasso_residual(X, y_real, seed = seed_sub)\n", " Xs <- scale(X, center = TRUE, scale = FALSE)\n", " svd_X <- svd(Xs, nu = n, nv = 0)\n", " U <- svd_X$u\n", " }\n", "\n", " # Sign-flip noise, scaled to match real data's noise level\n", " target_noise_sd <- sd(y_real) * noise_scale\n", " seed_flip <- make_seed(rep_i, n, \"flip\", h2 = h2_sp, nc = n_causal)\n", " noise <- gen_signflip_noise(U, resid, target_noise_sd, seed = 
seed_flip)\n", "\n", " # Causal signal: h2 = var(signal) / var(y)\n", " seed_causal <- make_seed(rep_i, n, \"causal\", h2 = h2_sp, nc = n_causal)\n", " set.seed(seed_causal)\n", " causal_idx <- sample(p, n_causal)\n", " y <- noise\n", " for (j in causal_idx) {\n", " bj <- sqrt(h2_sp * var(noise) / ((1 - h2_sp) * n_causal * var(X[, j])))\n", " y <- y + X[, j] * bj\n", " }\n", "\n", " # Fit both methods\n", " fit_gaus <- tryCatch(\n", " susie(X, y, L = L, verbose = FALSE),\n", " error = function(e) NULL)\n", " fit_ss <- tryCatch(\n", " susie(X, y, L = L, estimate_residual_method = \"NIG\",\n", " verbose = FALSE),\n", " error = function(e) NULL)\n", "\n", " extract <- function(fit, tag) {\n", " na_row <- data.frame(\n", " method = tag, rep = rep_i,\n", " discovered = NA_real_, n_true_cs = NA_real_, n_cs = NA_real_,\n", " mean_size = NA_real_, sigma2 = NA_real_,\n", " mean_V = NA_real_, max_V = NA_real_, sum_V = NA_real_,\n", " stringsAsFactors = FALSE)\n", " if (is.null(fit)) return(na_row)\n", "\n", " cs_obj <- susie_get_cs(fit, X = X, min_abs_corr = 0.5)\n", " cs <- cs_obj$cs\n", " ncs <- length(cs)\n", "\n", " discovered <- 0; n_true_cs <- 0; avg_size <- NA_real_\n", " if (ncs > 0) {\n", " discovered <- length(intersect(unique(unlist(cs)), causal_idx))\n", " n_true_cs <- sum(sapply(cs, function(s) any(causal_idx %in% s)))\n", " avg_size <- mean(sapply(cs, length))\n", " }\n", "\n", " V_vec <- fit$V\n", " if (is.null(V_vec)) V_vec <- rep(NA_real_, L)\n", " if (length(V_vec) == 1) V_vec <- rep(V_vec, L)\n", "\n", " data.frame(\n", " method = tag,\n", " rep = rep_i,\n", " discovered = discovered,\n", " n_true_cs = n_true_cs,\n", " n_cs = ncs,\n", " mean_size = avg_size,\n", " sigma2 = fit$sigma2,\n", " mean_V = mean(V_vec, na.rm = TRUE),\n", " max_V = max(V_vec, na.rm = TRUE),\n", " sum_V = sum(V_vec, na.rm = TRUE),\n", " stringsAsFactors = FALSE)\n", " }\n", "\n", " rbind(extract(fit_gaus, \"Gaussian\"), extract(fit_ss, \"SS\"))\n", " })\n", "}\n", "\n", 
"cat(\"Functions defined:\\n\")\n", "cat(\" Seeds: make_seed(rep_i, N, purpose, h2, nc)\\n\")\n", "cat(\" Checkpoint: compute_config_md5, checkpoint_init, checkpoint_completed_reps,\\n\")\n", "cat(\" checkpoint_load, checkpoint_save, checkpoint_save_meta\\n\")\n", "cat(\" Simulation: get_lasso_residual, gen_signflip_noise, run_one_rep\\n\")" ] }, { "cell_type": "markdown", "id": "e3cabf45", "metadata": {}, "source": [ "## Run simulation\n", "\n", "Per-setting results are checkpointed as individual `.rds` files.\n", "An MD5 hash of the full configuration (data fingerprint, noise calibration,\n", "all design parameters) is stored in `_meta.rds` and verified before every run.\n", "\n", "**Checkpoint behavior:**\n", "- **MD5 matches** \u2192 existing results are loaded; only new `rep_id`s are computed.\n", " Changing `n_rep` from 10 to 200 runs only reps 11\u2013200.\n", "- **MD5 mismatch** \u2192 all old results are automatically deleted and the\n", " simulation starts fresh. This triggers whenever the data, noise calibration,\n", " sample sizes, heritabilities, or causal counts change.\n", "- `checkpoint_save()` deduplicates by `rep_id` as a safety net against\n", " accidental re-runs.\n", "\n", "**Seed management:**\n", "- Each random operation (subsampling, sign-flip, causal placement) uses a\n", " deterministic seed derived from `(rep_id, N, h2, n_causal)` via `make_seed()`.\n", "- Same `rep_id` always produces the same result (reproducibility).\n", "- Different `rep_id`s always produce different draws (no collisions).\n", "- The checkpoint tracks which `rep_id`s are complete and never re-runs them." 
] }, { "cell_type": "code", "execution_count": null, "id": "3f6af90a", "metadata": { "execution": { "iopub.execute_input": "2026-02-26T01:50:36.359175Z", "iopub.status.busy": "2026-02-26T01:50:36.358571Z", "iopub.status.idle": "2026-02-26T01:50:36.453676Z", "shell.execute_reply": "2026-02-26T01:50:36.452682Z" } }, "outputs": [], "source": [ "outdir <- \"benchmark_results\"\n", "all_rds <- file.path(outdir, \"all_results.rds\")\n", "\n", "# --- Compute and verify config signature ---\n", "config_sig <- compute_config_md5(X_full, y_full, N_vals, h2_sparse,\n", " L_causal, L, noise_scale_factor)\n", "init <- checkpoint_init(outdir, config_sig)\n", "\n", "# --- Main simulation (incremental) ---\n", "all_results <- list()\n", "t_total <- proc.time()\n", "n_full <- nrow(X_full)\n", "ns <- noise_scale_factor\n", "any_new <- FALSE\n", "\n", "for (N in N_vals) {\n", " # \u2500\u2500 Which rep_ids does ANY setting at this N still need? \u2500\u2500\n", " # We precompute LASSO+SVD only for these, saving time when extending.\n", " needed_reps <- integer(0)\n", " for (h2 in h2_sparse) {\n", " for (nc in L_causal) {\n", " tag <- sprintf(\"N%d_h2%03d_nc%d\", N, round(h2 * 100), nc)\n", " done <- checkpoint_completed_reps(outdir, tag)\n", " todo <- setdiff(seq_len(n_rep), done)\n", " needed_reps <- union(needed_reps, todo)\n", " }\n", " }\n", " needed_reps <- sort(needed_reps)\n", "\n", " if (length(needed_reps) == 0) {\n", " # Everything cached \u2014 just load\n", " cat(sprintf(\"\\n=== N = %d: all settings complete, loading ===\\n\", N))\n", " for (h2 in h2_sparse) {\n", " for (nc in L_causal) {\n", " tag <- sprintf(\"N%d_h2%03d_nc%d\", N, round(h2 * 100), nc)\n", " res <- checkpoint_load(outdir, tag)\n", " # Trim to exactly n_rep reps\n", " done_ids <- sort(unique(res$rep))\n", " if (length(done_ids) > n_rep)\n", " res <- res[res$rep %in% done_ids[1:n_rep], ]\n", " all_results[[length(all_results) + 1]] <- res\n", " }\n", " }\n", " next\n", " }\n", "\n", " # \u2500\u2500 
Precompute LASSO + SVD only for needed reps \u2500\u2500\n", " cat(sprintf(\"\\n=== N = %d: precomputing %d / %d subsamples ===\\n\",\n", " N, length(needed_reps), n_rep))\n", " t_pre <- proc.time()\n", "\n", " keep_list <- vector(\"list\", n_rep)\n", " U_list <- vector(\"list\", n_rep)\n", " resid_list <- vector(\"list\", n_rep)\n", "\n", " for (i in needed_reps) {\n", " seed_i <- make_seed(i, N, \"subsample\")\n", " set.seed(seed_i)\n", " keep <- sample(n_full, N)\n", " keep_list[[i]] <- keep\n", " Xi <- X_full[keep, ]\n", " yi <- y_full[keep]\n", " resid_list[[i]] <- get_lasso_residual(Xi, yi, seed = seed_i)\n", " Xs <- scale(Xi, center = TRUE, scale = FALSE)\n", " svd_i <- svd(Xs, nu = N, nv = 0)\n", " U_list[[i]] <- svd_i$u\n", " }\n", " cat(sprintf(\" Precompute: %.0f sec\\n\", (proc.time() - t_pre)[3]))\n", "\n", " # \u2500\u2500 Run or extend each setting \u2500\u2500\n", " for (h2 in h2_sparse) {\n", " for (nc in L_causal) {\n", " tag <- sprintf(\"N%d_h2%03d_nc%d\", N, round(h2 * 100), nc)\n", " done_reps <- checkpoint_completed_reps(outdir, tag)\n", " todo_reps <- sort(setdiff(seq_len(n_rep), done_reps))\n", "\n", " if (length(todo_reps) == 0) {\n", " # Already complete \u2014 load\n", " cat(sprintf(\"[DONE] %s (%d reps)\\n\", tag, length(done_reps)))\n", " res <- checkpoint_load(outdir, tag)\n", " done_ids <- sort(unique(res$rep))\n", " if (length(done_ids) > n_rep)\n", " res <- res[res$rep %in% done_ids[1:n_rep], ]\n", " all_results[[length(all_results) + 1]] <- res\n", " next\n", " }\n", "\n", " if (length(done_reps) > 0) {\n", " cat(sprintf(\"[EXT] %s: %d -> %d reps ... \",\n", " tag, length(done_reps), length(done_reps) + length(todo_reps)))\n", " } else {\n", " cat(sprintf(\"[RUN] %s (%d reps) ... 
\", tag, length(todo_reps)))\n", " }\n", " t0 <- proc.time()\n", " any_new <- TRUE\n", "\n", " new_res <- do.call(rbind, future_lapply(todo_reps, function(i) {\n", " run_one_rep(i, nc, h2,\n", " X_full[keep_list[[i]], ], y_full[keep_list[[i]]],\n", " U_pre = U_list[[i]], resid_pre = resid_list[[i]],\n", " L = L, noise_scale = ns)\n", " }, future.seed = TRUE))\n", " new_res$N <- N\n", " new_res$h2_sparse <- h2\n", " new_res$n_causal <- nc\n", "\n", " # Save with dedup, then collect\n", " res <- checkpoint_save(outdir, tag, new_res)\n", " all_results[[length(all_results) + 1]] <- res\n", " cat(sprintf(\"done (%.0f sec)\\n\", (proc.time() - t0)[3]))\n", " }\n", " }\n", "}\n", "\n", "# --- Finalize ---\n", "results <- do.call(rbind, all_results)\n", "saveRDS(results, all_rds)\n", "checkpoint_save_meta(outdir, config_sig, n_rep)\n", "\n", "total_settings <- length(N_vals) * length(h2_sparse) * length(L_causal)\n", "if (any_new) {\n", " cat(sprintf(\"\\nCompleted: %d rows across %d settings, %.1f min\\n\",\n", " nrow(results), total_settings, (proc.time() - t_total)[3] / 60))\n", "} else {\n", " cat(sprintf(\"\\nAll %d settings x %d reps loaded from cache (%d rows)\\n\",\n", " total_settings, n_rep, nrow(results)))\n", "}\n", "cat(sprintf(\"Config MD5: %s\\nSaved: %s\\n\", config_sig$md5, all_rds))" ] }, { "cell_type": "markdown", "id": "0711cbfc", "metadata": {}, "source": [ "## Aggregate results" ] }, { "cell_type": "code", "execution_count": 5, "id": "b9dcf67e", "metadata": { "execution": { "iopub.execute_input": "2026-02-26T01:50:36.456160Z", "iopub.status.busy": "2026-02-26T01:50:36.455343Z", "iopub.status.idle": "2026-02-26T01:50:36.596256Z", "shell.execute_reply": "2026-02-26T01:50:36.595603Z" } }, "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ "Aggregated: 150 rows\n", "\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "method N h2 nc power cover cs/rep size sigma2 sum_V\n" ] }, { "name": "stdout", "output_type": "stream", 
"text": [ "---------------------------------------------------------------------------------- \n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Gaussian 30 0.25 1 0.000 0.000 0.00 0.0 0.3548 0.0492\n", "SS 30 0.25 1 0.000 0.000 0.00 0.0 0.9885 0.0144\n", "Gaussian 30 0.25 2 0.000 0.000 0.00 0.0 0.3524 0.0804\n", "SS 30 0.25 2 0.000 0.000 0.00 0.0 0.9383 0.0618\n", "Gaussian 30 0.25 3 0.000 0.000 0.10 114.0 0.3595 0.0652\n", "SS 30 0.25 3 0.000 0.000 0.10 1.0 0.9507 0.0629\n", "Gaussian 30 0.25 4 0.025 1.000 0.10 38.0 0.3594 0.0737\n", "SS 30 0.25 4 0.050 1.000 0.10 51.0 0.9465 0.0588\n", "Gaussian 30 0.25 5 0.000 0.000 0.00 0.0 0.3946 0.0461\n", "SS 30 0.25 5 0.000 0.000 0.00 0.0 0.9937 0.0209\n", "Gaussian 30 0.50 1 0.500 1.000 0.50 16.4 0.3096 0.3436\n", "SS 30 0.50 1 0.400 1.000 0.40 17.0 0.9013 0.3583\n", "Gaussian 30 0.50 2 0.050 0.500 0.20 18.5 0.4310 0.1511\n", "SS 30 0.50 2 0.050 1.000 0.10 44.0 0.9558 0.1640\n", "Gaussian 30 0.50 3 0.033 0.500 0.20 57.0 0.4689 0.2099\n", "SS 30 0.50 3 0.033 1.000 0.10 98.0 0.9008 0.2110\n", "Gaussian 30 0.50 4 0.000 0.000 0.00 0.0 0.5539 0.1411\n", "SS 30 0.50 4 0.000 0.000 0.00 0.0 0.9414 0.1234\n", "Gaussian 30 0.50 5 0.040 0.667 0.30 50.0 0.4545 0.2121\n", "SS 30 0.50 5 0.040 0.667 0.30 55.2 0.9480 0.1966\n", "Gaussian 30 0.75 1 0.900 0.818 1.10 23.5 0.2857 0.9284\n", "SS 30 0.75 1 0.900 0.818 1.10 26.4 0.9149 0.9965\n", "Gaussian 30 0.75 2 0.200 1.000 0.40 55.0 0.7479 0.4598\n", "SS 30 0.75 2 0.500 0.833 1.20 36.3 0.8881 0.7568\n", "Gaussian 30 0.75 3 0.000 0.000 0.10 9.0 0.7925 0.5512\n", "SS 30 0.75 3 0.333 0.909 1.10 35.1 0.8612 0.9012\n", "Gaussian 30 0.75 4 0.075 0.667 0.30 35.0 0.7472 0.3571\n", "SS 30 0.75 4 0.050 0.250 0.40 30.5 0.9647 0.4515\n", "Gaussian 30 0.75 5 0.000 0.000 0.00 0.0 0.9627 0.2646\n", "SS 30 0.75 5 0.000 0.000 0.10 23.0 0.9031 0.3866\n", "Gaussian 50 0.25 1 0.400 0.800 0.50 42.4 0.2792 0.0959\n", "SS 50 0.25 1 0.100 0.500 0.20 36.5 0.9503 0.0923\n", "Gaussian 50 0.25 2 0.050 
1.000 0.10 29.0 0.2984 0.0357\n", "SS 50 0.25 2 0.000 0.000 0.00 0.0 0.9930 0.0162\n", "Gaussian 50 0.25 3 0.000 0.000 0.00 0.0 0.3112 0.0282\n", "SS 50 0.25 3 0.000 0.000 0.00 0.0 0.9744 0.0176\n", "Gaussian 50 0.25 4 0.000 0.000 0.00 0.0 0.3148 0.0428\n", "SS 50 0.25 4 0.000 0.000 0.00 0.0 0.9804 0.0313\n", "Gaussian 50 0.25 5 0.000 0.000 0.00 0.0 0.3183 0.0248\n", "SS 50 0.25 5 0.000 0.000 0.00 0.0 0.9564 0.0139\n", "Gaussian 50 0.50 1 0.900 0.900 1.00 15.1 0.2538 0.2636\n", "SS 50 0.50 1 1.000 1.000 1.00 16.7 0.9277 0.2673\n", "Gaussian 50 0.50 2 0.300 1.000 0.60 43.3 0.3392 0.1998\n", "SS 50 0.50 2 0.200 1.000 0.40 28.0 0.8777 0.1949\n", "Gaussian 50 0.50 3 0.033 0.500 0.20 26.5 0.4075 0.1107\n", "SS 50 0.50 3 0.067 1.000 0.20 34.0 0.9443 0.1132\n", "Gaussian 50 0.50 4 0.025 1.000 0.10 22.0 0.4229 0.1048\n", "SS 50 0.50 4 0.000 0.000 0.00 0.0 0.9089 0.1230\n", "Gaussian 50 0.50 5 0.000 0.000 0.10 30.0 0.4312 0.1046\n", "SS 50 0.50 5 0.000 0.000 0.10 27.0 0.9386 0.0893\n", "Gaussian 50 0.75 1 1.000 0.909 1.10 6.6 0.2515 0.8487\n", "SS 50 0.75 1 1.000 0.909 1.10 6.7 0.9099 0.8861\n", "Gaussian 50 0.75 2 0.700 1.000 1.40 24.8 0.4038 0.7157\n", "SS 50 0.75 2 0.950 0.950 2.00 19.6 0.8456 0.8858\n", "Gaussian 50 0.75 3 0.167 0.714 0.70 31.9 0.5996 0.3930\n", "SS 50 0.75 3 0.333 0.833 1.20 20.5 0.8834 0.5194\n", "Gaussian 50 0.75 4 0.225 0.889 0.90 35.9 0.6118 0.5291\n", "SS 50 0.75 4 0.400 0.833 1.80 20.6 0.7905 0.7236\n", "Gaussian 50 0.75 5 0.100 0.833 0.60 36.8 0.6291 0.4547\n", "SS 50 0.75 5 0.100 0.714 0.70 37.7 0.9247 0.4804\n", "Gaussian 80 0.25 1 0.600 1.000 0.60 28.2 0.2611 0.1065\n", "SS 80 0.25 1 0.600 1.000 0.60 30.2 0.9336 0.0973\n", "Gaussian 80 0.25 2 0.250 1.000 0.50 56.6 0.2843 0.0845\n", "SS 80 0.25 2 0.150 0.750 0.40 36.5 0.9195 0.0892\n", "Gaussian 80 0.25 3 0.067 1.000 0.20 89.0 0.3009 0.0632\n", "SS 80 0.25 3 0.067 1.000 0.20 90.0 0.8980 0.0669\n", "Gaussian 80 0.25 4 0.000 0.000 0.10 30.0 0.2949 0.0544\n", "SS 80 0.25 4 0.000 0.000 0.10 34.0 
0.9421 0.0381\n", "Gaussian 80 0.25 5 0.000 0.000 0.00 0.0 0.3067 0.0277\n", "SS 80 0.25 5 0.000 0.000 0.00 0.0 0.9648 0.0162\n", "Gaussian 80 0.50 1 1.000 1.000 1.00 17.0 0.2579 0.2698\n", "SS 80 0.50 1 1.000 1.000 1.00 17.7 0.9116 0.2729\n", "Gaussian 80 0.50 2 0.600 1.000 1.20 21.5 0.2772 0.2060\n", "SS 80 0.50 2 0.600 0.923 1.30 28.3 0.8533 0.2110\n", "Gaussian 80 0.50 3 0.433 0.929 1.40 32.7 0.3041 0.2599\n", "SS 80 0.50 3 0.467 0.933 1.50 30.8 0.8257 0.2854\n", "Gaussian 80 0.50 4 0.150 0.833 0.60 26.9 0.3662 0.1682\n", "SS 80 0.50 4 0.125 0.571 0.70 34.1 0.8593 0.1838\n", "Gaussian 80 0.50 5 0.080 0.667 0.60 22.9 0.3730 0.1622\n", "SS 80 0.50 5 0.060 0.600 0.50 21.6 0.8765 0.1570\n", "Gaussian 80 0.75 1 1.000 1.000 1.00 4.7 0.2544 0.7452\n", "SS 80 0.75 1 1.000 1.000 1.00 5.0 0.8956 0.7553\n", "Gaussian 80 0.75 2 1.000 1.000 2.00 17.8 0.2589 0.7821\n", "SS 80 0.75 2 1.000 1.000 2.00 17.5 0.8198 0.8006\n", "Gaussian 80 0.75 3 0.800 0.889 2.70 31.6 0.2832 0.8133\n", "SS 80 0.75 3 0.900 0.931 2.90 24.8 0.7295 0.8457\n", "Gaussian 80 0.75 4 0.625 0.926 2.70 25.2 0.3933 0.6343\n", "SS 80 0.75 4 0.650 0.839 3.10 22.2 0.7387 0.7104\n", "Gaussian 80 0.75 5 0.420 0.875 2.40 33.4 0.4467 0.5773\n", "SS 80 0.75 5 0.520 0.867 3.00 21.3 0.7128 0.7192\n", "Gaussian 120 0.25 1 0.900 1.000 0.90 15.4 0.2832 0.1210\n", "SS 120 0.25 1 0.900 1.000 0.90 16.0 0.8931 0.1145\n", "Gaussian 120 0.25 2 0.200 0.667 0.60 33.6 0.3196 0.0771\n", "SS 120 0.25 2 0.150 0.600 0.50 41.7 0.8975 0.0719\n", "Gaussian 120 0.25 3 0.067 0.667 0.30 18.3 0.3153 0.0803\n", "SS 120 0.25 3 0.067 0.667 0.30 18.3 0.8969 0.0719\n", "Gaussian 120 0.25 4 0.100 1.000 0.30 65.0 0.3403 0.0916\n", "SS 120 0.25 4 0.100 1.000 0.30 67.7 0.8850 0.0897\n", "Gaussian 120 0.25 5 0.060 0.750 0.40 28.2 0.3080 0.0747\n", "SS 120 0.25 5 0.040 0.667 0.30 23.3 0.9096 0.0619\n", "Gaussian 120 0.50 1 0.900 0.900 1.00 11.3 0.2829 0.3406\n", "SS 120 0.50 1 0.900 0.900 1.00 11.6 0.9004 0.3385\n", "Gaussian 120 0.50 2 0.900 0.947 
1.90 11.0 0.2910 0.3074\n", "SS 120 0.50 2 0.900 0.947 1.90 11.4 0.8295 0.3099\n", "Gaussian 120 0.50 3 0.767 0.920 2.50 16.0 0.3004 0.2663\n", "SS 120 0.50 3 0.800 0.923 2.60 16.0 0.7698 0.2687\n", "Gaussian 120 0.50 4 0.500 0.833 2.40 28.6 0.3304 0.2843\n", "SS 120 0.50 4 0.550 0.846 2.60 29.4 0.7332 0.2988\n", "Gaussian 120 0.50 5 0.240 0.800 1.50 32.5 0.3810 0.2403\n", "SS 120 0.50 5 0.280 0.778 1.80 39.0 0.7369 0.2632\n", "Gaussian 120 0.75 1 1.000 1.000 1.00 2.6 0.2822 0.9560\n", "SS 120 0.75 1 1.000 1.000 1.00 2.6 0.9080 0.9646\n", "Gaussian 120 0.75 2 0.950 0.950 2.00 10.1 0.2855 0.9066\n", "SS 120 0.75 2 0.950 0.950 2.00 10.1 0.8121 0.9149\n", "Gaussian 120 0.75 3 0.967 0.967 3.00 11.8 0.2873 0.8667\n", "SS 120 0.75 3 0.967 0.967 3.00 11.8 0.7551 0.8784\n", "Gaussian 120 0.75 4 0.900 0.900 4.00 10.9 0.2893 0.9612\n", "SS 120 0.75 4 0.875 0.897 3.90 8.8 0.6696 0.9916\n", "Gaussian 120 0.75 5 0.840 0.913 4.60 12.3 0.3234 0.8059\n", "SS 120 0.75 5 0.880 0.936 4.70 12.8 0.6356 0.8142\n", "Gaussian 200 0.25 1 0.900 1.000 0.90 4.7 0.2628 0.1010\n", "SS 200 0.25 1 0.900 1.000 0.90 4.7 0.8614 0.0943\n", "Gaussian 200 0.25 2 0.900 0.947 1.90 32.5 0.2629 0.1123\n", "SS 200 0.25 2 0.900 1.000 1.80 37.8 0.8019 0.1058\n", "Gaussian 200 0.25 3 0.433 0.867 1.50 24.4 0.2801 0.0901\n", "SS 200 0.25 3 0.467 0.778 1.80 16.9 0.7260 0.1001\n", "Gaussian 200 0.25 4 0.150 0.600 1.00 23.2 0.2853 0.0935\n", "SS 200 0.25 4 0.200 0.667 1.20 30.9 0.7289 0.1040\n", "Gaussian 200 0.25 5 0.180 0.800 1.00 61.7 0.3001 0.0900\n", "SS 200 0.25 5 0.180 0.615 1.30 54.8 0.7085 0.0930\n", "Gaussian 200 0.50 1 1.000 1.000 1.00 8.1 0.2602 0.2946\n", "SS 200 0.50 1 1.000 1.000 1.00 7.9 0.8746 0.2890\n", "Gaussian 200 0.50 2 0.900 0.857 2.10 15.1 0.2601 0.2799\n", "SS 200 0.50 2 0.950 0.950 2.00 15.4 0.7852 0.2852\n", "Gaussian 200 0.50 3 0.867 0.897 2.90 12.7 0.2691 0.3097\n", "SS 200 0.50 3 0.933 0.933 3.00 12.9 0.7355 0.3154\n", "Gaussian 200 0.50 4 0.800 0.842 3.80 17.6 0.2630 0.2855\n", "SS 
200 0.50 4 0.850 0.895 3.80 13.5 0.6648 0.2901\n", "Gaussian 200 0.50 5 0.600 0.833 3.60 20.8 0.2824 0.2796\n", "SS 200 0.50 5 0.700 0.833 4.20 18.7 0.5515 0.2996\n", "Gaussian 200 0.75 1 0.900 0.900 1.00 6.3 0.2625 0.8121\n", "SS 200 0.75 1 0.900 0.900 1.00 6.5 0.9204 0.8088\n", "Gaussian 200 0.75 2 0.950 0.864 2.20 8.1 0.2581 0.8527\n", "SS 200 0.75 2 0.950 0.864 2.20 8.1 0.7703 0.8553\n", "Gaussian 200 0.75 3 0.967 1.000 2.90 8.1 0.2702 0.9140\n", "SS 200 0.75 3 0.967 1.000 2.90 8.3 0.7229 0.9178\n", "Gaussian 200 0.75 4 1.000 1.000 4.00 12.5 0.2693 0.7982\n", "SS 200 0.75 4 1.000 0.976 4.10 12.2 0.6519 0.8058\n", "Gaussian 200 0.75 5 0.960 0.941 5.10 12.0 0.2643 0.8823\n", "SS 200 0.75 5 0.960 0.941 5.10 11.4 0.5335 0.8937\n" ] } ], "source": [ "# Ensure numeric types\n", "for (col in c(\"discovered\", \"n_true_cs\", \"n_cs\", \"mean_size\",\n", " \"sigma2\", \"mean_V\", \"max_V\", \"sum_V\",\n", " \"N\", \"h2_sparse\", \"n_causal\")) {\n", " if (col %in% names(results))\n", " results[[col]] <- as.numeric(results[[col]])\n", "}\n", "\n", "# Aggregate across replicates\n", "groups <- unique(results[, c(\"method\", \"N\", \"h2_sparse\", \"n_causal\")])\n", "agg_list <- vector(\"list\", nrow(groups))\n", "\n", "for (gi in seq_len(nrow(groups))) {\n", " m <- groups$method[gi]\n", " nn <- groups$N[gi]\n", " h2 <- groups$h2_sparse[gi]\n", " nc <- groups$n_causal[gi]\n", " df <- results[results$method == m & results$N == nn &\n", " results$h2_sparse == h2 & results$n_causal == nc, ]\n", " if (nrow(df) == 0) next\n", "\n", " nr <- nrow(df)\n", " total_causal <- nc * nr\n", " s <- function(x) sum(x, na.rm = TRUE)\n", " mn <- function(x) mean(x, na.rm = TRUE)\n", "\n", " agg_list[[gi]] <- data.frame(\n", " method = m,\n", " N = nn,\n", " h2_sparse = h2,\n", " n_causal = nc,\n", " power = s(df$discovered) / total_causal,\n", " coverage = ifelse(s(df$n_cs) > 0, s(df$n_true_cs) / s(df$n_cs), NA),\n", " total_cs = s(df$n_cs),\n", " cs_size = mn(df$mean_size),\n", " 
mean_sigma2 = mn(df$sigma2),\n", " mean_V = mn(df$mean_V),\n", " max_V = mn(df$max_V),\n", " sum_V = mn(df$sum_V),\n", " stringsAsFactors = FALSE)\n", "}\n", "\n", "agg <- do.call(rbind, agg_list)\n", "rownames(agg) <- NULL\n", "\n", "# Factor columns for plotting\n", "agg$BF <- factor(agg$method, levels = c(\"SS\", \"Gaussian\"))\n", "agg$L <- agg$n_causal\n", "agg$n <- agg$N\n", "agg$cs_per_rep <- agg$total_cs / n_rep\n", "\n", "cat(sprintf(\"Aggregated: %d rows\\n\\n\", nrow(agg)))\n", "\n", "# Print summary table\n", "cat(sprintf(\"%-10s %3s %5s %3s %6s %6s %6s %6s %8s %8s\\n\",\n", " \"method\", \"N\", \"h2\", \"nc\", \"power\", \"cover\", \"cs/rep\", \"size\", \"sigma2\", \"sum_V\"))\n", "cat(paste(rep(\"-\", 82), collapse = \"\"), \"\\n\")\n", "for (i in seq_len(nrow(agg))) {\n", " a <- agg[i, ]\n", " cat(sprintf(\"%-10s %3d %5.2f %3d %6.3f %6.3f %6.2f %6.1f %8.4f %8.4f\\n\",\n", " a$method, a$N, a$h2_sparse, a$n_causal,\n", " a$power,\n", " ifelse(is.na(a$coverage), 0, a$coverage),\n", " a$cs_per_rep,\n", " ifelse(is.na(a$cs_size), 0, a$cs_size),\n", " a$mean_sigma2,\n", " a$sum_V))\n", "}" ] }, { "cell_type": "code", "execution_count": 6, "id": "b4129cd6", "metadata": { "execution": { "iopub.execute_input": "2026-02-26T01:50:36.598116Z", "iopub.status.busy": "2026-02-26T01:50:36.597625Z", "iopub.status.idle": "2026-02-26T01:50:36.625088Z", "shell.execute_reply": "2026-02-26T01:50:36.624478Z" } }, "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ "Plot theme set.\n" ] } ], "source": [ "library(ggplot2)\n", "library(cowplot)\n", "library(gridExtra)\n", "library(grid)\n", "\n", "figdir <- \"benchmark_results\"\n", "\n", "methods_colors <- c(\"SS\" = \"#D41159\", \"Gaussian\" = \"#1A85FF\")\n", "\n", "perf_theme <- theme_cowplot(font_size = 16) +\n", " theme(\n", " legend.position = \"none\",\n", " panel.grid.major.y = element_line(color = \"gray80\"),\n", " panel.grid.major.x = element_blank(),\n", " panel.grid.minor = element_blank(),\n", " 
axis.line = element_line(linewidth = 1, color = \"black\"),\n", " axis.ticks = element_line(linewidth = 1, color = \"black\"),\n", " axis.ticks.length = unit(0.25, \"cm\"),\n", " plot.margin = margin(t = 2, r = 2, b = 2, l = 2, unit = \"mm\"),\n", " axis.text = element_text(size = 14, face = \"bold\"),\n", " axis.title = element_text(size = 16, face = \"bold\"),\n", " plot.title = element_text(size = 16, face = \"bold\")\n", " )\n", "dot_size <- 4\n", "cat(\"Plot theme set.\\n\")" ] }, { "cell_type": "code", "execution_count": 7, "id": "177d7260", "metadata": { "execution": { "iopub.execute_input": "2026-02-26T01:50:36.627107Z", "iopub.status.busy": "2026-02-26T01:50:36.626651Z", "iopub.status.idle": "2026-02-26T01:50:42.131843Z", "shell.execute_reply": "2026-02-26T01:50:42.131168Z" } }, "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ "Saved: benchmark_h2025.{pdf,png}\n", "Saved: benchmark_h2050.{pdf,png}\n", "Saved: benchmark_h2075.{pdf,png}\n" ] } ], "source": [ "# --- Replace NA/NaN with 0 so every dot is plotted ---\n", "agg$coverage_plot <- ifelse(is.na(agg$coverage), 0, agg$coverage)\n", "agg$cs_size_plot <- ifelse(is.na(agg$cs_size) | is.nan(agg$cs_size), 0, agg$cs_size)\n", "\n", "# Dodge width: horizontally separate the two methods\n", "dodge <- position_dodge(width = 0.4)\n", "\n", "for (h2 in h2_sparse) {\n", " d <- agg[agg$h2_sparse == h2, ]\n", "\n", " plots <- list()\n", " for (ni in seq_along(N_vals)) {\n", " nn <- N_vals[ni]\n", " dd <- d[d$N == nn, ]\n", " ylab_fn <- function(lab) if (ni == 1) lab else \"\"\n", "\n", " # \u2500\u2500 Coverage (use coverage_plot: NA \u2192 0) \u2500\u2500\n", " p_cov <- ggplot(dd, aes(x = as.factor(L), y = coverage_plot, col = BF)) +\n", " geom_point(size = dot_size, position = dodge) +\n", " geom_hline(yintercept = 0.95, linetype = \"dashed\", linewidth = 1) +\n", " scale_color_manual(values = methods_colors) +\n", " coord_cartesian(ylim = c(-0.02, 1.02)) +\n", " ylab(ylab_fn(\"Coverage\")) + 
xlab(\"\") + perf_theme\n", " plots[[paste0(\"cov_\", nn)]] <- p_cov\n", "\n", " # \u2500\u2500 Power (linear scale, 0 shown at bottom) \u2500\u2500\n", " p_pow <- ggplot(dd, aes(x = as.factor(L), y = power, col = BF)) +\n", " geom_point(size = dot_size, position = dodge) +\n", " scale_color_manual(values = methods_colors) +\n", " coord_cartesian(ylim = c(-0.02, 1.02)) +\n", " ylab(ylab_fn(\"Power\")) + xlab(\"\") + perf_theme\n", " plots[[paste0(\"pow_\", nn)]] <- p_pow\n", "\n", " # \u2500\u2500 CS per replicate \u2500\u2500\n", " p_ncs <- ggplot(dd, aes(x = as.factor(L), y = cs_per_rep, col = BF)) +\n", " geom_point(size = dot_size, position = dodge) +\n", " scale_color_manual(values = methods_colors) +\n", " coord_cartesian(ylim = c(-0.05, max(agg$cs_per_rep, na.rm = TRUE) * 1.05)) +\n", " ylab(ylab_fn(\"CS / replicate\")) + xlab(\"\") + perf_theme\n", " plots[[paste0(\"ncs_\", nn)]] <- p_ncs\n", "\n", " # \u2500\u2500 CS size (use cs_size_plot: NaN \u2192 0) \u2500\u2500\n", " cs_max <- max(agg$cs_size_plot, na.rm = TRUE)\n", " p_size <- ggplot(dd, aes(x = as.factor(L), y = cs_size_plot, col = BF)) +\n", " geom_point(size = dot_size, position = dodge) +\n", " scale_color_manual(values = methods_colors) +\n", " coord_cartesian(ylim = c(-0.5, cs_max * 1.05)) +\n", " ylab(ylab_fn(\"CS size\")) + xlab(\"\") + perf_theme\n", " plots[[paste0(\"size_\", nn)]] <- p_size\n", "\n", " # \u2500\u2500 sum V (prior variance diagnostic) \u2500\u2500\n", " p_sumv <- ggplot(dd, aes(x = as.factor(L), y = sum_V, col = BF)) +\n", " geom_point(size = dot_size, position = dodge) +\n", " scale_color_manual(values = methods_colors) +\n", " coord_cartesian(ylim = c(-0.01, max(agg$sum_V, na.rm = TRUE) * 1.05)) +\n", " ylab(ylab_fn(expression(Sigma~V))) + xlab(\"\") + perf_theme\n", " plots[[paste0(\"sumv_\", nn)]] <- p_sumv\n", "\n", " # \u2500\u2500 sigma2 \u2500\u2500\n", " p_sig <- ggplot(dd, aes(x = as.factor(L), y = mean_sigma2, col = BF)) +\n", " geom_point(size = dot_size, 
position = dodge) +\n", " scale_color_manual(values = methods_colors) +\n", " coord_cartesian(ylim = c(-0.01, max(agg$mean_sigma2, na.rm = TRUE) * 1.1)) +\n", " ylab(ylab_fn(expression(hat(sigma)^2))) +\n", " xlab(\"Number of causal variants\") + perf_theme\n", " plots[[paste0(\"sig_\", nn)]] <- p_sig\n", " }\n", "\n", " # Column headers\n", " titles <- lapply(N_vals, function(nn)\n", " textGrob(label = paste0(\"N = \", nn),\n", " gp = gpar(fontsize = 16, fontface = \"bold\")))\n", "\n", " metric_rows <- c(\"cov\", \"pow\", \"ncs\", \"size\", \"sumv\", \"sig\")\n", " plot_grobs <- lapply(metric_rows, function(r)\n", " lapply(N_vals, function(nn) plots[[paste0(r, \"_\", nn)]]))\n", " plot_grobs <- do.call(c, plot_grobs)\n", "\n", " n_cols <- length(N_vals)\n", " fig <- arrangeGrob(\n", " arrangeGrob(grobs = titles, ncol = n_cols),\n", " arrangeGrob(grobs = plot_grobs, ncol = n_cols, nrow = 6),\n", " heights = c(0.04, 1),\n", " top = textGrob(sprintf(\"h2_sparse = %d%%\", round(h2 * 100)),\n", " gp = gpar(fontsize = 18, fontface = \"bold\")))\n", "\n", " fn <- sprintf(\"benchmark_h2%03d\", round(h2 * 100))\n", " pdf(file.path(figdir, paste0(fn, \".pdf\")), width = 26, height = 20)\n", " grid.draw(fig); dev.off()\n", " png(file.path(figdir, paste0(fn, \".png\")), width = 26, height = 20,\n", " units = \"in\", res = 150)\n", " grid.draw(fig); dev.off()\n", " cat(sprintf(\"Saved: %s.{pdf,png}\\n\", fn))\n", "}" ] }, { "cell_type": "code", "execution_count": 8, "id": "ebd9214a", "metadata": { "execution": { "iopub.execute_input": "2026-02-26T01:50:42.133533Z", "iopub.status.busy": "2026-02-26T01:50:42.133062Z", "iopub.status.idle": "2026-02-26T01:50:42.192191Z", "shell.execute_reply": "2026-02-26T01:50:42.191600Z" } }, "outputs": [ { "data": { "text/html": [ "agg_record_497274838: 2" ], "text/latex": [ "\\textbf{agg\\textbackslash{}\\_record\\textbackslash{}\\_497274838:} 2" ], "text/markdown": [ "**agg_record_497274838:** 2" ], "text/plain": [ "agg_record_497274838 \n", 
" 2 " ] }, "metadata": {}, "output_type": "display_data" }, { "data": { "text/html": [ "agg_record_497274838: 2" ], "text/latex": [ "\\textbf{agg\\textbackslash{}\\_record\\textbackslash{}\\_497274838:} 2" ], "text/markdown": [ "**agg_record_497274838:** 2" ], "text/plain": [ "agg_record_497274838 \n", " 2 " ] }, "metadata": {}, "output_type": "display_data" }, { "name": "stdout", "output_type": "stream", "text": [ "Saved: benchmark_legend.{pdf,png}\n" ] } ], "source": [ "# --- Standalone legend ---\n", "legend_df <- data.frame(\n", " x = c(1, 1), y = c(1, 2),\n", " grp = factor(c(\"SS (Servin-Stephens)\", \"Gaussian (standard)\"),\n", " levels = c(\"SS (Servin-Stephens)\", \"Gaussian (standard)\")))\n", "legend_colors <- c(\"SS (Servin-Stephens)\" = \"#D41159\",\n", " \"Gaussian (standard)\" = \"#1A85FF\")\n", "p_leg <- ggplot(legend_df, aes(x, y, col = grp)) +\n", " geom_point(size = 5) +\n", " scale_color_manual(values = legend_colors, name = \"Method\") +\n", " theme_void() +\n", " theme(legend.position = \"bottom\",\n", " legend.text = element_text(size = 14, face = \"bold\"),\n", " legend.title = element_text(size = 16, face = \"bold\"))\n", "legend_grob <- cowplot::get_legend(p_leg)\n", "\n", "pdf(file.path(figdir, \"benchmark_legend.pdf\"), width = 8, height = 1)\n", "grid::grid.draw(legend_grob); dev.off()\n", "png(file.path(figdir, \"benchmark_legend.png\"), width = 8, height = 1,\n", " units = \"in\", res = 150)\n", "grid::grid.draw(legend_grob); dev.off()\n", "cat(\"Saved: benchmark_legend.{pdf,png}\\n\")" ] }, { "cell_type": "markdown", "id": "4328be95", "metadata": {}, "source": [ "## Results\n", "\n", "*Results will be summarized here after reviewing the simulation output.*\n", "\n", "## How to run\n", "\n", "From the `inst/notebooks/` directory:\n", "\n", "```bash\n", "jupyter nbconvert --to notebook --execute \\\n", " --ExecutePreprocessor.timeout=0 \\\n", " --output small_sample_benchmark_executed.ipynb \\\n", " small_sample_benchmark.ipynb\n", 
"```\n", "\n", "The `--ExecutePreprocessor.timeout=0` flag disables the cell timeout so the\n", "simulation can run as long as needed. With 60 settings x 200 replicates and\n", "10 parallel workers, expect roughly 4-8 hours on a modern machine.\n", "\n", "The simulation is **incremental**: existing results in `benchmark_results/`\n", "are preserved and only new replicates are computed. To extend from 200 to 400\n", "replicates, change `n_rep` in the config cell and re-run. To start fresh\n", "(e.g., after switching to a different dataset), either delete\n", "`benchmark_results/_meta.rds` or simply change the data file; the config\n", "signature check will detect the mismatch and clear old results automatically." ] } ], "metadata": { "kernelspec": { "display_name": "R", "language": "R", "name": "ir" }, "language_info": { "codemirror_mode": "r", "file_extension": ".r", "mimetype": "text/x-r-source", "name": "R", "pygments_lexer": "r", "version": "4.4.3" } }, "nbformat": 4, "nbformat_minor": 5 } ================================================ FILE: inst/notebooks/stochastic_ld_benchmark.ipynb ================================================ { "cells": [ { "cell_type": "markdown", "metadata": {}, "source": "# Stochastic LD Correction Benchmark\n\n## Does the SER variance inflation correction control FDR when using stochastic LD?\n\nWhen individual-level genotype data is unavailable, SuSiE-RSS can use a **stochastic LD sketch** to approximate the LD matrix. The sketch is formed by random projection:\n\n$$\\hat{R} = \\frac{1}{B} U U^\\top, \\quad U = X_{\\text{std}}^\\top W, \\quad W \\sim N(0, I_B / n)$$\n\nwhere $X_{\\text{std}}$ is the column-standardized genotype matrix ($n \\times p$) and $B$ is the sketch size.\n\nHowever, the noise in $\\hat{R}$ inflates the variance of the SER residuals under the null, leading to **elevated false discovery rate (FDR)** if uncorrected. 
The `stochastic_ld_sample` parameter in `susie_rss()` activates a dynamic variance inflation correction in the single-effect regression (SER) that accounts for this noise at every IBSS iteration.\n\nThis notebook benchmarks the correction across different sketch sizes $B \\in \\{2000, 5000, 10000\\}$, comparing:\n1. **Gold standard** -- in-sample LD ($R = \\text{cor}(X)$)\n2. **Subsample** -- $R$ from a subsample of $B$ individuals\n3. **Stochastic sketch, no correction** -- sketch $U$ passed as `X`, no `stochastic_ld_sample`\n4. **Stochastic sketch, with correction** -- sketch $U$ passed as `X`, `stochastic_ld_sample = B`\n5. **Stochastic sketch + NIG prior, with correction** -- sketch $U$ with `estimate_residual_method = \"NIG\"` and `stochastic_ld_sample = B`\n\nMethod 5 uses the Normal-Inverse-Gamma (NIG) prior which integrates out the residual variance $\\sigma^2$ analytically, producing t-distributed marginals instead of Gaussian. This tests whether the NIG prior interacts properly with the stochastic LD variance inflation correction." }, { "cell_type": "markdown", "metadata": {}, "source": [ "## Background: Stochastic LD Sketch\n", "\n", "Given a standardized genotype matrix $X_{\\text{std}} \\in \\mathbb{R}^{n \\times p}$, the true LD matrix is:\n", "\n", "$$R = \\frac{1}{n-1} X_{\\text{std}}^\\top X_{\\text{std}}$$\n", "\n", "The stochastic sketch approximates $R$ using a random projection matrix $W \\in \\mathbb{R}^{n \\times B}$ with $W_{ij} \\sim N(0, 1/n)$:\n", "\n", "$$U = X_{\\text{std}}^\\top W \\in \\mathbb{R}^{p \\times B}$$\n", "\n", "Each column of $U$ is approximately drawn from $N(0, R)$, so $\\hat{R} = U U^\\top / B \\to R$ as $B \\to \\infty$.\n", "\n", "In `susie_rss()`, we pass `X = t(U)` (a $B \\times p$ matrix) and the function treats it as a \"genotype-like\" input whose cross-product approximates the LD structure." 
] }, { "cell_type": "markdown", "metadata": {}, "source": "## SER Variance Inflation Correction\n\nIn each IBSS iteration, the SER computes a residual for variant $j$ after removing the effect of the $l$-th single effect:\n\n$$\\hat{r}_j = z_j - \\hat{R}_{j,:} \\bar{\\beta}_{-l}$$\n\nUnder the null $H_0: \\beta_j = 0$, the variance of $\\hat{r}_j$ when using the noisy sketch $\\hat{R}$ is:\n\n$$\\tau_j^2 = \\sigma^2 + \\frac{\\eta_j^2 + v_g}{B}$$\n\nwhere:\n- $\\sigma^2$ is the current residual variance estimate (updated each IBSS iteration),\n- $\\eta_j = \\hat{R}_{j,:} \\bar{\\beta}_{-l}$ is the predicted effect at variant $j$ from other effects,\n- $v_g = \\bar{\\beta}_{-l}^\\top \\hat{R} \\bar{\\beta}_{-l}$ is the total genetic variance from other effects.\n\nThe inflation factor $\\tau_j^2 / \\sigma^2 = 1 + (\\eta_j^2 + v_g) / (B \\sigma^2)$ is **dynamic**: it depends on the current IBSS state and is recomputed at every iteration for every single-effect regression. This means the correction is strongest near active signals (where $\\eta_j^2$ is large due to LD) and vanishes under the global null ($\\bar{\\beta}_{-l} = 0$).\n\nSetting `stochastic_ld_sample = B` in `susie_rss()` activates this correction." 
}, { "cell_type": "code", "execution_count": null, "metadata": {}, "outputs": [], "source": "# ============================================================\n# Setup: parameters and logging\n# ============================================================\nlibrary(susieR)\n\nif (requireNamespace(\"Rfast\", quietly = TRUE)) {\n library(Rfast)\n fast_cor <- Rfast::cora\n cat(\"Using Rfast::cora for correlation matrices (much faster)\\n\")\n} else {\n fast_cor <- cor\n cat(\"Rfast not available, using base cor() (consider installing Rfast)\\n\")\n}\n\n# --- Simulation parameters ---\np <- 5000\nn <- 100000\nn_causal <- 4\npve_per <- 0.0012 # PVE per causal\nB_values <- c(2000, 5000, 10000)\nn_rep <- 50 # set to 250 for full run\nL <- 10\nseed <- 999\n\n# --- Log file for monitoring progress from the terminal ---\n# When running via jupyter nbconvert, cat() output is captured into the\n# notebook and NOT shown on screen. To monitor progress, open a second\n# terminal and run: tail -f stochastic_ld_benchmark.log\nLOG_FILE <- \"stochastic_ld_benchmark.log\"\nlog_con <- file(LOG_FILE, open = \"w\")\n\nlog_msg <- function(fmt, ...) {\n msg <- sprintf(paste0(\"[%s] \", fmt, \"\\n\"), format(Sys.time(), \"%H:%M:%S\"), ...)\n cat(msg) # notebook cell output\n cat(msg, file = log_con) # log file for tail -f\n flush(log_con)\n}\n\nset.seed(seed)\nlog_msg(\"Stochastic LD Benchmark started\")\nlog_msg(\" susieR version: %s\", packageVersion(\"susieR\"))\nlog_msg(\" Parameters: p=%d, n=%d, n_causal=%d, pve_per=%.4f, n_rep=%d\",\n p, n, n_causal, pve_per, n_rep)\nlog_msg(\" B values: %s\", paste(B_values, collapse = \", \"))\nlog_msg(\" Log file: %s (run 'tail -f %s' to monitor)\", LOG_FILE, LOG_FILE)" }, { "cell_type": "markdown", "metadata": {}, "source": [ "## Function Definitions\n", "\n", "All simulation functions are defined here. The main execution cell below calls them." 
] }, { "cell_type": "code", "execution_count": null, "metadata": {}, "outputs": [], "source": "# ============================================================\n# Function: build_ld_structure\n# Build block-diagonal AR(1) LD structure\n# Returns: list with blocks, block_membership, n_blocks\n# ============================================================\nbuild_ld_structure <- function(p, seed = 42) {\n set.seed(seed)\n blocks <- list()\n block_membership <- integer(p)\n pos <- 1\n block_id <- 0\n while (pos <= p) {\n block_id <- block_id + 1\n bsize <- min(sample(20:50, 1), p - pos + 1)\n rho <- runif(1, 0.4, 0.98)\n idx <- pos:(pos + bsize - 1)\n block_membership[idx] <- block_id\n R_block <- rho^abs(outer(1:bsize, 1:bsize, \"-\"))\n blocks[[block_id]] <- list(idx = idx, R = R_block, rho = rho, size = bsize)\n pos <- pos + bsize\n }\n list(blocks = blocks, block_membership = block_membership, n_blocks = block_id)\n}\n\n# ============================================================\n# Function: generate_genotypes\n# Generate X (n x p) with block-diagonal LD, standardize columns,\n# compute true in-sample R = cor(X).\n# Returns: list(X, R_true)\n# ============================================================\ngenerate_genotypes <- function(n, ld_struct, seed = 43) {\n set.seed(seed)\n p <- sum(sapply(ld_struct$blocks, function(b) b$size))\n log_msg(\" Allocating X (%d x %d), ~%.1f GB\", n, p, n * p * 8 / 1e9)\n X <- matrix(0, nrow = n, ncol = p)\n n_blocks <- length(ld_struct$blocks)\n for (b in seq_along(ld_struct$blocks)) {\n block <- ld_struct$blocks[[b]]\n L_chol <- chol(block$R)\n Z <- matrix(rnorm(n * block$size), nrow = n, ncol = block$size)\n X[, block$idx] <- Z %*% L_chol\n if (b %% 25 == 0 || b == n_blocks)\n log_msg(\" Block %d/%d done (variants %d-%d)\",\n b, n_blocks, min(block$idx), max(block$idx))\n }\n log_msg(\" Standardizing columns...\")\n X <- scale(X)\n attr(X, \"scaled:center\") <- NULL\n attr(X, \"scaled:scale\") <- NULL\n log_msg(\" Computing R 
= fast_cor(X) [%d x %d]...\", p, p)\n R_true <- fast_cor(X)\n list(X = X, R_true = R_true)\n}\n\n# ============================================================\n# Function: compute_ld_approximations\n# For each B, compute stochastic sketch and subsample R.\n# Returns: list(sketches, R_subs)\n# ============================================================\ncompute_ld_approximations <- function(X, B_values, seed = 44) {\n set.seed(seed)\n n <- nrow(X); p <- ncol(X)\n sketches <- list()\n R_subs <- list()\n for (B in B_values) {\n Bstr <- as.character(B)\n log_msg(\" B=%d: generating sketch W(%d x %d), U = X'W (%d x %d)...\",\n B, n, B, p, B)\n t0 <- proc.time()\n W <- matrix(rnorm(n * B, sd = 1 / sqrt(n)), nrow = n, ncol = B)\n U <- crossprod(X, W)\n sketches[[Bstr]] <- t(U)\n rm(W, U)\n log_msg(\" Sketch done in %.1f sec (%d x %d)\",\n (proc.time() - t0)[3], nrow(sketches[[Bstr]]), ncol(sketches[[Bstr]]))\n log_msg(\" B=%d: computing subsample R from %d individuals...\", B, B)\n t0 <- proc.time()\n R_subs[[Bstr]] <- fast_cor(X[sample(n, B), ])\n log_msg(\" Subsample R done in %.1f sec\", (proc.time() - t0)[3])\n }\n list(sketches = sketches, R_subs = R_subs)\n}\n\n# ============================================================\n# Function: simulate_phenotype\n# Pick causal variants from different blocks, generate y.\n# ============================================================\nsimulate_phenotype <- function(X, ld_struct, n_causal, pve_per) {\n n <- nrow(X); p <- ncol(X)\n causal_blocks <- sample(ld_struct$n_blocks, n_causal)\n causal_idx <- sapply(causal_blocks, function(b) sample(ld_struct$blocks[[b]]$idx, 1))\n total_pve <- pve_per * n_causal\n sigma_e2 <- 1 - total_pve\n beta_j <- sqrt(pve_per * sigma_e2 / (1 - total_pve))\n beta <- rep(0, p)\n beta[causal_idx] <- beta_j\n y <- as.vector(X %*% beta + rnorm(n, sd = sqrt(sigma_e2)))\n list(y = y, causal_idx = causal_idx, beta = beta)\n}\n\n# ============================================================\n# Function: 
compute_zscores\n# Marginal z-scores via individual-level univariate regressions.\n# ============================================================\ncompute_zscores <- function(X, y) {\n n <- nrow(X); p <- ncol(X)\n z <- numeric(p)\n for (j in seq_len(p)) {\n fit <- .lm.fit(cbind(1, X[, j]), y)\n bhat <- fit$coefficients[2]\n rss <- sum(fit$residuals^2)\n se <- sqrt(rss / (n - 2)) / sqrt(sum((X[, j] - mean(X[, j]))^2))\n z[j] <- bhat / se\n }\n z\n}\n\n# ============================================================\n# Function: evaluate_fit\n# Extract CS, return RAW COUNTS for proper aggregation.\n# FDR and power are computed from accumulated counts across replicates.\n# ============================================================\nevaluate_fit <- function(fit, true_causal) {\n cs <- susie_get_cs(fit)$cs\n n_cs <- length(cs)\n if (n_cs == 0) {\n return(list(n_cs = 0, n_true_cs = 0, n_false_cs = 0,\n n_found = 0, n_causal = length(true_causal), mean_size = 0))\n }\n n_true_cs <- sum(sapply(cs, function(s) any(true_causal %in% s)))\n n_false_cs <- n_cs - n_true_cs\n n_found <- sum(sapply(true_causal, function(c)\n any(sapply(cs, function(s) c %in% s))))\n list(n_cs = n_cs, n_true_cs = n_true_cs, n_false_cs = n_false_cs,\n n_found = n_found, n_causal = length(true_causal),\n mean_size = mean(sapply(cs, length)))\n}\n\n# ============================================================\n# Function: run_one_method\n# Run susie_rss with given inputs, evaluate, return one-row df.\n# ============================================================\nrun_one_method <- function(method_name, z, causal_idx, n, L, ...) 
{\n t0 <- proc.time()\n fit <- tryCatch(\n susie_rss(z = z, n = n, L = L, max_iter = 200, verbose = FALSE, ...),\n error = function(e) { log_msg(\" %s ERROR: %s\", method_name, e$message); NULL }\n )\n if (is.null(fit)) return(NULL)\n ev <- evaluate_fit(fit, causal_idx)\n elapsed <- (proc.time() - t0)[3]\n # Compute per-replicate rates for the log line\n rep_power <- ev$n_found / ev$n_causal\n rep_fdr <- if (ev$n_cs > 0) ev$n_false_cs / ev$n_cs else 0\n log_msg(\" %-25s %5.1fs | power=%.2f fdr=%.2f n_cs=%d size=%.0f\",\n method_name, elapsed, rep_power, rep_fdr, ev$n_cs, ev$mean_size)\n data.frame(method = method_name,\n n_cs = ev$n_cs, n_true_cs = ev$n_true_cs, n_false_cs = ev$n_false_cs,\n n_found = ev$n_found, n_causal = ev$n_causal,\n mean_size = ev$mean_size,\n stringsAsFactors = FALSE)\n}\n\n# ============================================================\n# Function: summarize_results\n# Aggregate raw counts across replicates, compute FDR and power.\n# ============================================================\nsummarize_results <- function(results) {\n methods <- unique(results$method)\n # Order methods logically\n method_order <- c(\"insample_R\")\n for (B in B_values) {\n method_order <- c(method_order,\n paste0(\"subsample_B\", B),\n paste0(\"stoch_B\", B, \"_nocorr\"),\n paste0(\"stoch_B\", B, \"_corr\"),\n paste0(\"stoch_B\", B, \"_NIG_corr\"))\n }\n methods <- method_order[method_order %in% methods]\n\n summary_rows <- list()\n for (m in methods) {\n rows <- results[results$method == m, ]\n total_cs <- sum(rows$n_cs)\n total_false_cs <- sum(rows$n_false_cs)\n total_found <- sum(rows$n_found)\n total_causal <- sum(rows$n_causal)\n # Weighted mean CS size (weight by n_cs per replicate)\n if (total_cs > 0) {\n avg_size <- sum(rows$mean_size * rows$n_cs) / total_cs\n } else {\n avg_size <- 0\n }\n summary_rows[[length(summary_rows) + 1]] <- data.frame(\n method = m,\n total_cs = total_cs,\n total_false_cs = total_false_cs,\n total_found = total_found,\n 
total_causal = total_causal,\n FDR = if (total_cs > 0) total_false_cs / total_cs else 0,\n power = total_found / total_causal,\n mean_size = avg_size,\n n_rep = nrow(rows),\n stringsAsFactors = FALSE\n )\n }\n do.call(rbind, summary_rows)\n}\n\n# ============================================================\n# Function: run_simulation\n# Main loop: for each replicate, simulate phenotype, compute z,\n# run all methods, collect results. Print final summary.\n# ============================================================\nrun_simulation <- function(X, R_true, sketches, R_subs, ld_struct,\n B_values, n_rep, n_causal, pve_per, L, seed) {\n set.seed(seed)\n n <- nrow(X)\n results <- list()\n rep_times <- numeric()\n t_total <- proc.time()\n\n for (rep_i in seq_len(n_rep)) {\n eta_str <- \"\"\n if (rep_i > 1) {\n eta_min <- mean(rep_times) * (n_rep - rep_i + 1) / 60\n eta_str <- sprintf(\" (ETA: %.0f min)\", eta_min)\n }\n log_msg(\"=== Replicate %d / %d ===%s\", rep_i, n_rep, eta_str)\n t_rep <- proc.time()\n\n # Simulate phenotype\n sim <- simulate_phenotype(X, ld_struct, n_causal, pve_per)\n log_msg(\" Causal variants: %s\", paste(sim$causal_idx, collapse = \", \"))\n\n # Compute z-scores\n t_z <- proc.time()\n log_msg(\" Computing z-scores (%d variants)...\", ncol(X))\n z <- compute_zscores(X, sim$y)\n log_msg(\" z-scores done in %.1f sec, max|z|=%.2f\",\n (proc.time() - t_z)[3], max(abs(z)))\n\n # Gold standard\n row <- run_one_method(\"insample_R\", z, sim$causal_idx, n, L, R = R_true)\n if (!is.null(row)) { row$rep <- rep_i; results[[length(results) + 1]] <- row }\n\n # For each B\n for (B in B_values) {\n Bstr <- as.character(B)\n # Subsample\n row <- run_one_method(sprintf(\"subsample_B%d\", B), z, sim$causal_idx,\n n, L, R = R_subs[[Bstr]])\n if (!is.null(row)) { row$rep <- rep_i; results[[length(results) + 1]] <- row }\n # Stochastic, no correction\n row <- run_one_method(sprintf(\"stoch_B%d_nocorr\", B), z, sim$causal_idx,\n n, L, X = sketches[[Bstr]])\n if 
(!is.null(row)) { row$rep <- rep_i; results[[length(results) + 1]] <- row }\n # Stochastic, with correction\n row <- run_one_method(sprintf(\"stoch_B%d_corr\", B), z, sim$causal_idx,\n n, L, X = sketches[[Bstr]], stochastic_ld_sample = B)\n if (!is.null(row)) { row$rep <- rep_i; results[[length(results) + 1]] <- row }\n # Stochastic + NIG prior, with correction\n row <- run_one_method(sprintf(\"stoch_B%d_NIG_corr\", B), z, sim$causal_idx,\n n, L, X = sketches[[Bstr]], stochastic_ld_sample = B,\n estimate_residual_method = \"NIG\")\n if (!is.null(row)) { row$rep <- rep_i; results[[length(results) + 1]] <- row }\n }\n\n elapsed_rep <- (proc.time() - t_rep)[3]\n rep_times <- c(rep_times, elapsed_rep)\n log_msg(\" Replicate %d done in %.1f sec (%.1f min)\",\n rep_i, elapsed_rep, elapsed_rep / 60)\n }\n\n elapsed_total <- (proc.time() - t_total)[3]\n log_msg(\"All %d replicates completed in %.1f min (avg %.1f sec/rep)\",\n n_rep, elapsed_total / 60, mean(rep_times))\n\n results_df <- do.call(rbind, results)\n\n # --- Final summary (accumulated across all replicates) ---\n summary_df <- summarize_results(results_df)\n log_msg(\"\")\n log_msg(\"====================================================\")\n log_msg(\" FINAL SUMMARY (accumulated over %d replicates)\", n_rep)\n log_msg(\"====================================================\")\n log_msg(\"%-30s %6s %6s %6s %8s %8s\",\n \"method\", \"FDR\", \"power\", \"n_cs\", \"false\", \"size\")\n log_msg(\"%-30s %6s %6s %6s %8s %8s\",\n \"------------------------------\", \"------\", \"------\", \"------\", \"--------\", \"--------\")\n for (i in seq_len(nrow(summary_df))) {\n s <- summary_df[i, ]\n log_msg(\"%-30s %6.3f %6.3f %6d %8d %8.0f\",\n s$method, s$FDR, s$power, s$total_cs, s$total_false_cs, s$mean_size)\n }\n log_msg(\"====================================================\")\n\n list(results = results_df, summary = summary_df)\n}\n\nlog_msg(\"All functions defined.\")" }, { "cell_type": "markdown", "metadata": {}, 
"source": [ "## Run Simulation\n", "\n", "Execution proceeds in four phases:\n", "1. Build LD structure (fast)\n", "2. Generate genotype matrix and true LD (slow \u2014 several minutes)\n", "3. Pre-compute stochastic sketches and subsample LD for each $B$\n", "4. Run replicates: simulate phenotype, compute z-scores, run all methods\n", "\n", "**To monitor progress**, open a second terminal and run:\n", "```bash\n", "tail -f stochastic_ld_benchmark.log\n", "```" ] }, { "cell_type": "code", "execution_count": null, "metadata": {}, "outputs": [], "source": "# ============================================================\n# Phase 1: Build LD structure\n# ============================================================\nlog_msg(\"Phase 1: Building LD structure (p=%d)...\", p)\nld_struct <- build_ld_structure(p, seed = seed)\nlog_msg(\" %d blocks, sizes %d-%d, rho %.2f-%.2f\",\n ld_struct$n_blocks,\n min(sapply(ld_struct$blocks, function(b) b$size)),\n max(sapply(ld_struct$blocks, function(b) b$size)),\n min(sapply(ld_struct$blocks, function(b) b$rho)),\n max(sapply(ld_struct$blocks, function(b) b$rho)))\n\n# ============================================================\n# Phase 2: Generate genotypes and true LD\n# ============================================================\nlog_msg(\"Phase 2: Generating genotypes (%d x %d)...\", n, p)\nt0 <- proc.time()\ngeno <- generate_genotypes(n, ld_struct, seed = seed + 1)\nX <- geno$X\nR_true <- geno$R_true\nrm(geno)\nlog_msg(\"Phase 2 complete in %.1f min\", (proc.time() - t0)[3] / 60)\n\n# ============================================================\n# Phase 3: Pre-compute LD approximations\n# ============================================================\nlog_msg(\"Phase 3: Computing LD approximations for B = {%s}...\",\n paste(B_values, collapse = \", \"))\nt0 <- proc.time()\nld_approx <- compute_ld_approximations(X, B_values, seed = seed + 2)\nsketches <- ld_approx$sketches\nR_subs <- ld_approx$R_subs\nrm(ld_approx)\nlog_msg(\"Phase 
3 complete in %.1f min\", (proc.time() - t0)[3] / 60)\n\n# ============================================================\n# Phase 4: Run simulation replicates\n# ============================================================\nn_methods <- 1 + length(B_values) * 4 # insample + 4 per B\nlog_msg(\"Phase 4: Running %d replicates x %d methods...\", n_rep, n_methods)\nsim_output <- run_simulation(X, R_true, sketches, R_subs, ld_struct,\n B_values, n_rep, n_causal, pve_per, L,\n seed = seed + 100)\nresults <- sim_output$results\nsummary_df <- sim_output$summary\nlog_msg(\"Simulation complete. %d result rows.\", nrow(results))" }, { "cell_type": "code", "execution_count": null, "metadata": {}, "outputs": [], "source": [ "# ============================================================\n", "# Save results to RDS (both per-replicate and summary)\n", "# ============================================================\n", "rds_file <- sprintf(\"stochastic_ld_benchmark_n%d_p%d_nrep%d.rds\", n, p, n_rep)\n", "saveRDS(list(results = results, summary = summary_df), file = rds_file)\n", "log_msg(\"Results saved to %s\", rds_file)\n", "close(log_con) # close log file\n", "\n", "cat(\"\\n=== FINAL SUMMARY ===\\n\")\n", "print(summary_df[, c(\"method\", \"FDR\", \"power\", \"total_cs\", \"total_false_cs\", \"mean_size\")],\n", " row.names = FALSE)" ] }, { "cell_type": "markdown", "metadata": {}, "source": [ "## Results and Visualization\n", "\n", "Three plots:\n", "1. **FDR bar plot** \u2014 with a horizontal line at the nominal 0.05 level\n", "2. **Power bar plot**\n", "3. **Power vs. 
FDR scatter** \u2014 summarizing the trade-off" ] }, { "cell_type": "code", "execution_count": null, "metadata": {}, "outputs": [], "source": "# ============================================================\n# Load and display summary (from accumulated raw counts)\n# ============================================================\n# To reload from saved file:\n# dat <- readRDS(rds_file)\n# results <- dat$results\n# summary_df <- dat$summary\n\n# Order methods logically\nmethod_order <- c(\"insample_R\")\nfor (B in B_values) {\n method_order <- c(method_order,\n paste0(\"subsample_B\", B),\n paste0(\"stoch_B\", B, \"_nocorr\"),\n paste0(\"stoch_B\", B, \"_corr\"),\n paste0(\"stoch_B\", B, \"_NIG_corr\"))\n}\nsummary_df$method <- factor(summary_df$method, levels = method_order)\nsummary_df <- summary_df[order(summary_df$method), ]\n\ncat(\"\\n=== Summary (accumulated over all replicates) ===\\n\")\nprint(summary_df[, c(\"method\", \"FDR\", \"power\", \"total_cs\", \"total_false_cs\",\n \"total_found\", \"total_causal\", \"mean_size\")], row.names = FALSE)" }, { "cell_type": "code", "execution_count": null, "metadata": {}, "outputs": [], "source": "# ============================================================\n# FDR bar plot (from accumulated counts)\n# ============================================================\nmethod_colors <- c(\"insample_R\" = \"gray50\")\nfor (B in B_values) {\n method_colors[paste0(\"subsample_B\", B)] <- \"steelblue\"\n method_colors[paste0(\"stoch_B\", B, \"_nocorr\")] <- \"tomato\"\n method_colors[paste0(\"stoch_B\", B, \"_corr\")] <- \"seagreen\"\n method_colors[paste0(\"stoch_B\", B, \"_NIG_corr\")] <- \"mediumpurple\"\n}\n\npar(mar = c(12, 4, 3, 1))\nbp <- barplot(summary_df$FDR, names.arg = summary_df$method,\n col = method_colors[as.character(summary_df$method)],\n las = 2, ylab = \"FDR\", main = \"False Discovery Rate by Method\",\n ylim = c(0, max(summary_df$FDR, 0.1) * 1.2))\nabline(h = 0.05, col = \"darkred\", lty = 2, lwd = 
2)\ntext(max(bp), 0.05, \" 0.05\", adj = c(0, -0.3), col = \"darkred\", cex = 0.8)\nlegend(\"topright\",\n legend = c(\"In-sample R\", \"Subsample\", \"Stoch (no corr)\",\n \"Stoch (corrected)\", \"NIG (corrected)\"),\n fill = c(\"gray50\", \"steelblue\", \"tomato\", \"seagreen\",\n \"mediumpurple\"), cex = 0.7, bty = \"n\")" }, { "cell_type": "code", "execution_count": null, "metadata": {}, "outputs": [], "source": "# ============================================================\n# Power bar plot (from accumulated counts)\n# ============================================================\npar(mar = c(12, 4, 3, 1))\nbp <- barplot(summary_df$power, names.arg = summary_df$method,\n col = method_colors[as.character(summary_df$method)],\n las = 2, ylab = \"Power\", main = \"Power by Method\",\n ylim = c(0, 1))\nlegend(\"topright\",\n legend = c(\"In-sample R\", \"Subsample\", \"Stoch (no corr)\",\n \"Stoch (corrected)\", \"NIG (corrected)\"),\n fill = c(\"gray50\", \"steelblue\", \"tomato\", \"seagreen\",\n \"mediumpurple\"), cex = 0.7, bty = \"n\")" }, { "cell_type": "code", "execution_count": null, "metadata": {}, "outputs": [], "source": "# ============================================================\n# Power vs FDR scatter plot (from accumulated counts)\n# ============================================================\npar(mar = c(5, 4, 3, 1))\nmethod_pch <- c(\"insample_R\" = 16)\npch_vals <- c(17, 15, 18)\nfor (i in seq_along(B_values)) {\n B <- B_values[i]\n method_pch[paste0(\"subsample_B\", B)] <- pch_vals[i]\n method_pch[paste0(\"stoch_B\", B, \"_nocorr\")] <- pch_vals[i]\n method_pch[paste0(\"stoch_B\", B, \"_corr\")] <- pch_vals[i]\n method_pch[paste0(\"stoch_B\", B, \"_NIG_corr\")] <- pch_vals[i]\n}\n\nplot(summary_df$FDR, summary_df$power, type = \"n\",\n xlim = c(0, max(summary_df$FDR, 0.1) * 1.3), ylim = c(0, 1),\n xlab = \"FDR\", ylab = \"Power\", main = \"Power vs FDR\")\npoints(summary_df$FDR, summary_df$power,\n col = 
method_colors[as.character(summary_df$method)],\n pch = method_pch[as.character(summary_df$method)], cex = 2)\ntext(summary_df$FDR, summary_df$power, labels = summary_df$method,\n pos = 4, cex = 0.5, col = \"gray30\")\nabline(v = 0.05, col = \"darkred\", lty = 2, lwd = 2)\ntext(0.05, 0, \"FDR = 0.05\", adj = c(-0.1, -0.3), col = \"darkred\", cex = 0.8)\nlegend(\"bottomright\",\n legend = c(\"In-sample R\", \"Subsample\", \"Stoch (no corr)\",\n \"Stoch (corrected)\", \"NIG (corrected)\",\n paste0(\"B=\", B_values)),\n col = c(\"gray50\", \"steelblue\", \"tomato\", \"seagreen\",\n \"mediumpurple\", rep(\"black\", 3)),\n pch = c(16, 16, 16, 16, 16, pch_vals),\n pt.cex = 1.5, cex = 0.6, bty = \"n\")" }, { "cell_type": "markdown", "metadata": {}, "source": [ "## Command-Line Execution\n", "\n", "```bash\n", "cd /path/to/notebooks\n", "\n", "# Terminal 1: run the notebook\n", "jupyter nbconvert --execute --to notebook \\\n", " --output stochastic_ld_benchmark_executed.ipynb \\\n", " --ExecutePreprocessor.timeout=7200 \\\n", " stochastic_ld_benchmark.ipynb\n", "\n", "# Terminal 2: monitor progress\n", "tail -f stochastic_ld_benchmark.log\n", "```\n", "\n", "For the full run, edit the setup cell to set `n_rep <- 250`.\n", "\n", "Results are saved to `stochastic_ld_benchmark_n100000_p5000_nrep250.rds`." 
] } ], "metadata": { "kernelspec": { "display_name": "R", "language": "R", "name": "ir" }, "language_info": { "codemirror_mode": "r", "file_extension": ".r", "mimetype": "text/x-r-source", "name": "R", "pygments_lexer": "r", "version": "4.4.3" } }, "nbformat": 4, "nbformat_minor": 4 } ================================================ FILE: man/FinemappingConvergence.Rd ================================================ % Generated by roxygen2: do not edit by hand % Please edit documentation in R/example_dataset.R \docType{data} \name{FinemappingConvergence} \alias{FinemappingConvergence} \title{Simulated Fine-mapping Data with Convergence Problem.} \format{ \code{FinemappingConvergence} is a list with the following elements: \describe{ \item{XtX}{Summary statistics computed using the centered and scaled genotype matrix.} \item{Xty}{Summary statistics computed using the centered and scaled genotype data, and the centered simulated response.} \item{yty}{yty is computed using the centered simulated response.} \item{n}{The sample size (50,000).} \item{true_coef}{The coefficients used to simulate the responses.} \item{z}{z-scores from a simple (single-SNP) linear regression.}} } \description{ Data simulated using real genotypes from 50,000 individuals and 200 SNPs. Two of the SNPs have non-zero effects on the multivariate response. The response data are generated under a linear regression model. The simulated response and the columns of the genotype matrix are centered. } \examples{ data(FinemappingConvergence) } \seealso{ A similar data set with more SNPs is used in the \dQuote{Refine SuSiE model} vignette. 
} \keyword{data} ================================================ FILE: man/N2finemapping.Rd ================================================ % Generated by roxygen2: do not edit by hand % Please edit documentation in R/example_dataset.R \docType{data} \name{N2finemapping} \alias{N2finemapping} \title{Simulated Fine-mapping Data with Two Effect Variables} \format{ \code{N2finemapping} is a list with the following elements: \describe{ \item{X}{Centered and scaled genotype data.} \item{chrom}{Chromosome of the original data, in hg38 coordinates.} \item{pos}{Chromosomal position of the original data, in hg38 coordinates. The information can be used to compare impact of using other genotype references of the same variables in \code{susie_rss} application.} \item{true_coef}{Simulated effect sizes.} \item{residual_variance}{Simulated residual covariance matrix.} \item{Y}{Simulated multivariate response.} \item{allele_freq}{Allele frequencies based on the original genotype data.} \item{V}{Suggested prior covariance matrix for effect sizes of the two non-zero effect variables.} } } \description{ This data set contains a genotype matrix for 574 individuals and 1,002 variables. The variables are genotypes after centering and scaling, and therefore retain the correlation structure of the original genotype data. Two of the variables have non-zero effects on the multivariate response. The response data are generated under a multivariate linear regression model. See Wang \emph{et al} (2020) for details. } \examples{ data(N2finemapping) } \references{ G. Wang, A. Sarkar, P. Carbonetto and M. Stephens (2020). A simple new approach to variable selection in regression, with application to genetic fine-mapping. \emph{Journal of the Royal Statistical Society, Series B} \doi{10.1101/501114}. 
} \keyword{data} ================================================ FILE: man/N3finemapping.Rd ================================================ % Generated by roxygen2: do not edit by hand % Please edit documentation in R/example_dataset.R \docType{data} \name{N3finemapping} \alias{N3finemapping} \title{Simulated Fine-mapping Data with Three Effect Variables.} \format{ \code{N3finemapping} is a list with the following elements: \describe{ \item{X}{N by P variable matrix of centered and scaled genotype data.} \item{chrom}{Chromosome of the original data, in hg38 coordinate.} \item{pos}{Chromosomal position of the original data, in hg38 coordinate. The information can be used to compare impact of using other genotype references of the same variables in susie_rss application.} \item{true_coef}{The simulated effect sizes.} \item{residual_variance}{The simulated residual covariance matrix.} \item{Y}{The simulated response variables.} \item{allele_freq}{Allele frequency of the original genotype data.} \item{V}{Prior covariance matrix for effect size of the three non-zero effect variables.} } } \description{ The data-set contains a matrix of 574 individuals and 1,001 variables. These variables are real-world genotypes centered and scaled, and therefore retain the correlation structure of variables in the original genotype data. 3 out of the variables have non-zero effects. The response data is generated under a multivariate linear regression model. See Wang \emph{et al} (2020) for more details. } \examples{ data(N3finemapping) } \references{ G. Wang, A. Sarkar, P. Carbonetto and M. Stephens (2020). A simple new approach to variable selection in regression, with application to genetic fine-mapping. \emph{Journal of the Royal Statistical Society, Series B} \doi{10.1101/501114}. 
} \keyword{data} ================================================ FILE: man/SummaryConsistency.Rd ================================================ % Generated by roxygen2: do not edit by hand % Please edit documentation in R/example_dataset.R \docType{data} \name{SummaryConsistency} \alias{SummaryConsistency} \title{Simulated Fine-mapping Data with LD matrix From Reference Panel.} \format{ \code{SummaryConsistency} is a list with the following elements: \describe{ \item{z}{z-scores computed by fitting univariate simple regression variable-by-variable.} \item{ldref}{LD matrix estimated from the reference panel.} \item{flip_id}{The index of the SNP with the flipped allele.} \item{signal_id}{The index of the SNP with the non-zero effect.}} } \description{ Data simulated using real genotypes from 10,000 individuals and 200 SNPs. One SNP has a non-zero effect on the multivariate response. The response data are generated under a linear regression model. There is also one SNP with a flipped allele between summary statistics and the reference panel. } \examples{ data(SummaryConsistency) } \seealso{ A similar data set with more samples is used in the \dQuote{Diagnostic for fine-mapping with summary statistics} vignette. } \keyword{data} ================================================ FILE: man/absolute.order.Rd ================================================ % Generated by roxygen2: do not edit by hand % Please edit documentation in R/univariate_regression.R \name{absolute.order} \alias{absolute.order} \title{Ordering of Predictors from Coefficient Estimates} \usage{ absolute.order(beta) } \arguments{ \item{beta}{A vector of estimated regression coefficients.} } \value{ An ordering of the predictors. } \description{ This function orders the predictors by decreasing order of the magnitude of the estimated regression coefficient. 
} \examples{ ### generate synthetic data set.seed(1) n = 200 p = 300 X = matrix(rnorm(n*p),n,p) beta = double(p) beta[1:10] = 1:10 y = X \%*\% beta + rnorm(n) ### order predictors by magnitude of univariate regression coefficient beta.hat = univariate_regression(X,y)$betahat order = absolute.order(beta.hat) } ================================================ FILE: man/add_delta_features.Rd ================================================ % Generated by roxygen2: do not edit by hand % Please edit documentation in R/diagnosis_reports.R \name{add_delta_features} \alias{add_delta_features} \title{Add per-slot delta features (change from previous iteration)} \usage{ add_delta_features(df) } \arguments{ \item{df}{data.frame from collect_ash_diag + label_diag_truth} } \value{ df with added delta_, lag1_, and cum_ columns } \description{ Computes delta_c_hat, delta_V, delta_lbf, delta_max_alpha, delta_alpha_entropy, delta_purity for each slot across iterations. Also adds lag1 features (previous iteration values) and cumulative features (max c_hat ever, min alpha_entropy ever). These temporal features help ML models detect trajectories (e.g., a slot that was strong then weakened = collapse signal). } \examples{ \dontrun{ df <- susieR:::collect_ash_diag(fit) df <- susieR:::label_diag_truth(df, fit, causal) df <- susieR:::add_delta_features(df) # Now df has delta_c_hat, lag1_c_hat, cum_max_c_hat, etc. 
# Use for decision tree: rpart::rpart(cs_label ~ ., data = df_last_iter) } } \keyword{internal} ================================================ FILE: man/block_coordinate_ascent.Rd ================================================ % Generated by roxygen2: do not edit by hand % Please edit documentation in R/refinement.R \name{block_coordinate_ascent} \alias{block_coordinate_ascent} \title{Block coordinate ascent for iterative model refinement.} \usage{ block_coordinate_ascent( model, data, step_fn, max_iter = 100, tol = 0.001, verbose = FALSE ) } \arguments{ \item{model}{Fitted model (e.g., from \code{susie_workhorse} or \code{mvsusie_workhorse}).} \item{data}{Data object passed to \code{step_fn}.} \item{step_fn}{A function with signature \code{function(model, data, iter)} that performs one block coordinate update. Must return a named list with elements: \describe{ \item{model}{(required) The updated model.} \item{data}{(optional) Updated data object, e.g. after changing residual variance. If \code{NULL}, the data is unchanged.} \item{converged}{(optional) Logical; if \code{TRUE}, stop iterating.} \item{log_msg}{(optional) Character string appended to verbose output.} }} \item{max_iter}{Maximum number of block ascent iterations (default 100).} \item{tol}{Convergence tolerance for relative ELBO change (default 1e-3).} \item{verbose}{If \code{TRUE}, print progress each iteration (default \code{FALSE}).} } \value{ The refined model, with \code{model$converged} set to \code{TRUE} or \code{FALSE}. } \description{ Generic framework for post-convergence refinement of fitted models. Repeatedly applies a block update (\code{step_fn}) to a fitted model, monitoring ELBO for convergence and stability. Both CS refinement (\code{\link{run_refine}}) and residual variance estimation (mvsusieR) are instances of block coordinate ascent over different parameter blocks. 
} \details{ Convergence is reached when either: \itemize{ \item \code{step_fn} returns \code{converged = TRUE} (the block update signals no further improvement), or \item the relative ELBO change falls below \code{tol} (ELBO stabilized across block updates). } A warning is issued if the ELBO decreases between iterations. } ================================================ FILE: man/calculate_posterior_moments_mixture_common.Rd ================================================ % Generated by roxygen2: do not edit by hand % Please edit documentation in R/mixture_prior.R \name{calculate_posterior_moments_mixture_common} \alias{calculate_posterior_moments_mixture_common} \title{Compute mixture posterior moments} \usage{ calculate_posterior_moments_mixture_common(params, model, l) } \arguments{ \item{params}{Params object with prior_variance_grid and mixture_weights} \item{model}{Model with lbf_grid[[l]] (p x K), alpha[l,] already computed, and ser_stats cached from loglik_mixture_common} \item{l}{Effect index} } \value{ Updated model with mu[l,] and mu2[l,] } \description{ For each grid point k, computes the conjugate normal posterior moments (mean, variance) given prior variance V_k. Forms the mixture posterior using responsibility weights r_jk = w_k * BF_jk / sum_k' w_k' * BF_jk'. } \details{ Uses betahat and shat2 from ser_stats (produced by the data-type-specific compute_ser_statistics), so this function is data-type-agnostic. } \keyword{internal} ================================================ FILE: man/check_alpha_pip_cycle_convergence.Rd ================================================ % Generated by roxygen2: do not edit by hand % Please edit documentation in R/susie_utils.R \name{check_alpha_pip_cycle_convergence} \alias{check_alpha_pip_cycle_convergence} \title{Check alpha/PIP fixed-point or short-cycle convergence} \usage{ check_alpha_pip_cycle_convergence(data, params, model) } \description{ Uses one tolerance for both marginal PIPs and alpha. 
Lag 1 is ordinary convergence; larger lags detect a periodic orbit and average alpha over it. } \keyword{internal} ================================================ FILE: man/cleanup_extra_fields.Rd ================================================ % Generated by roxygen2: do not edit by hand % Please edit documentation in R/generic_methods.R \name{cleanup_extra_fields} \alias{cleanup_extra_fields} \title{Class-specific extra fields to strip in cleanup_model.default} \usage{ cleanup_extra_fields(data) } \description{ Default returns `character(0)`. Subclasses (e.g., mfsusieR's `raw_residuals`, mvsusieR's `Y_imputed`/`llik_cache`) override to add their per-class scratch fields. Result is unioned with the standard temp_fields list inside `cleanup_model.default`. } \keyword{internal} ================================================ FILE: man/coef.mr.ash.Rd ================================================ % Generated by roxygen2: do not edit by hand % Please edit documentation in R/mr.ash.R \name{coef.mr.ash} \alias{coef.mr.ash} \title{Extract Regression Coefficients from Mr.ASH Fit} \usage{ \method{coef}{mr.ash}(object, ...) } \arguments{ \item{object}{A Mr.ASH fit, usually the result of calling \code{mr.ash}.} \item{...}{Additional arguments passed to the default S3 method.} } \value{ A p+1 vector. The first element gives the estimated intercept, and the remaining p elements are the estimated regression coefficients. } \examples{ ## generate synthetic data set.seed(1) n = 200 p = 300 X = matrix(rnorm(n*p),n,p) beta = double(p) beta[1:10] = 1:10 y = X \%*\% beta + rnorm(n) ## fit mr.ash fit.mr.ash = mr.ash(X, y) ## coefficient coef.mr.ash = coef(fit.mr.ash) intercept = coef.mr.ash[1] beta = coef.mr.ash[-1] } \description{ Retrieve posterior mean estimates of the regression coefficients in a Mr.ASH model. 
} ================================================ FILE: man/coef.susie.Rd ================================================ % Generated by roxygen2: do not edit by hand % Please edit documentation in R/predict.susie.R \name{coef.susie} \alias{coef.susie} \title{Extract regression coefficients from susie fit} \usage{ \method{coef}{susie}(object, ...) } \arguments{ \item{object}{A susie fit.} \item{\dots}{Additional arguments passed to the generic \code{coef} method.} } \value{ A p+1 vector, the first element being an intercept, and the remaining p elements being estimated regression coefficients. } \description{ Extract regression coefficients from susie fit } ================================================ FILE: man/collect_ash_diag.Rd ================================================ % Generated by roxygen2: do not edit by hand % Please edit documentation in R/diagnosis_reports.R \name{collect_ash_diag} \alias{collect_ash_diag} \title{Collect diagnostic data.frames across iterations} \usage{ collect_ash_diag(fit) } \arguments{ \item{fit}{SuSiE fit object (must have been run with .ash_debug = TRUE)} } \value{ data.frame with nrow = L * n_ash_iters, or NULL if no diagnostics } \description{ Call this after running susie() to rbind all per-iteration diagnostics into a single ML-ready data.frame. 
} \examples{ \dontrun{ # Full ML pipeline: data(unmappable_data) X <- unmappable_data$X; y <- as.vector(unmappable_data$y) causal <- which(unmappable_data$beta != 0) fit <- susie(X, y, L=10, slot_prior=slot_prior_betabinom(), unmappable_effects="ash", max_iter=50) df <- susieR:::collect_ash_diag(fit) # all iterations df <- susieR:::label_diag_truth(df, fit, causal) # TP/FP labels df <- susieR:::add_delta_features(df) # temporal features # Inspect FP slot across iterations: subset(df, cs_label == "FP", select = c(iter, slot, sentinel, c_hat, lbf, max_alpha, alpha_entropy, mask_tier, delta_c_hat)) # 4-way comparison (BB+ash vs V0, with/without mr.ash): options(susie.skip_mrash = TRUE) fit_nomrash <- susie(X, y, L=10, slot_prior=slot_prior_betabinom(), unmappable_effects="ash", max_iter=50) options(susie.skip_mrash = FALSE) df_nomrash <- susieR:::collect_ash_diag(fit_nomrash) # Decision tree analysis: # library(rpart) # last_iter <- df[df$iter == max(df$iter) & df$V > 0, ] # tree <- rpart(cs_label ~ c_hat + lbf + max_alpha + alpha_entropy + # purity + mask_tier + delta_c_hat, data = last_iter) } } \keyword{internal} ================================================ FILE: man/compare_ash_methods.Rd ================================================ % Generated by roxygen2: do not edit by hand % Please edit documentation in R/diagnosis_reports.R \name{compare_ash_methods} \alias{compare_ash_methods} \title{Compare two diagnostic runs side by side} \usage{ compare_ash_methods(df1, df2, label1 = "Method1", label2 = "Method2") } \arguments{ \item{df1}{First diagnostic data.frame} \item{df2}{Second diagnostic data.frame} \item{label1}{Label for first run (e.g., "BB+ash")} \item{label2}{Label for second run (e.g., "V0")} } \description{ Takes two data.frames (from diagnose_bb_ash_iter or diagnose_ash_filter_archived_iter) at the same iteration and prints a side-by-side comparison. 
} \keyword{internal} ================================================ FILE: man/compute_marginal_bhat_shat.Rd ================================================ % Generated by roxygen2: do not edit by hand % Please edit documentation in R/univariate_regression.R \name{compute_marginal_bhat_shat} \alias{compute_marginal_bhat_shat} \title{Per-Position Marginal OLS Regression of `Y` on Each Column of `X`} \usage{ compute_marginal_bhat_shat(X, Y, predictor_weights = NULL, sigma2 = NULL) } \arguments{ \item{X}{numeric matrix `n x J`, expected column-centred.} \item{Y}{numeric matrix `n x T` or numeric vector of length `n`. When a vector, is treated as a one-column matrix.} \item{predictor_weights}{optional numeric vector of length `J` giving `colSums(X^2)`. Computed internally when `NULL`. Callers that have this cached on the data object pass it through to avoid recomputation.} \item{sigma2}{optional numeric scalar giving a known residual variance. When supplied, `Shat[j, t] = sqrt(sigma2 / predictor_weights[j])` (single-effect-residual form). When `NULL`, `Shat` is the per-pair empirical residual standard error: for each `(j, t)` pair, the sample SD of `Y[, t] - X[, j] * Bhat[j, t]` divided by `sqrt(n - 1)`. The latter matches the form used by data-driven prior init routines (e.g., for fitting a normal-mixture prior via `ashr::ash`).} } \value{ list with elements `Bhat` (`J x T`) and `Shat` (`J x T`). } \description{ Computes the marginal OLS regression coefficient and standard error for each `(X column, Y column)` pair, treating the regressions as independent. `X` is assumed column-centred (no intercept term in the per-pair regression); each `Y` column is treated independently. Returns the J x T matrices `Bhat` and `Shat`. Used internally by single-effect-regression style routines that need a per-position marginal estimate. Vectorised across columns of `Y` so callers can pass either a numeric vector (T = 1) or a numeric matrix (T > 1) without looping at the call site. 
} \examples{ set.seed(1) X <- matrix(rnorm(50 * 5), 50, 5) X <- scale(X, center = TRUE, scale = FALSE) Y <- matrix(rnorm(50 * 3), 50, 3) out <- compute_marginal_bhat_shat(X, Y) dim(out$Bhat) # 5 x 3 dim(out$Shat) # 5 x 3 } ================================================ FILE: man/compute_suff_stat.Rd ================================================ % Generated by roxygen2: do not edit by hand % Please edit documentation in R/susie_rss_utils.R \name{compute_suff_stat} \alias{compute_suff_stat} \title{Compute sufficient statistics for input to \code{susie_ss}} \usage{ compute_suff_stat(X, y, standardize = FALSE) } \arguments{ \item{X}{An n by p matrix of covariates.} \item{y}{An n vector.} \item{standardize}{Logical flag indicating whether to standardize columns of X to unit variance prior to computing summary data} } \value{ A list of sufficient statistics (\code{XtX, Xty, yty, n}) and \code{X_colmeans}, \code{y_mean}. } \description{ Computes the sufficient statistics \eqn{X'X, X'y, y'y} and \eqn{n} after centering (and possibly standardizing) the columns of \eqn{X} and centering \eqn{y} to have mean zero. We also store the column means of \eqn{X} and mean of \eqn{y}. } \examples{ data(N2finemapping) ss <- compute_suff_stat(N2finemapping$X, N2finemapping$Y[, 1]) } ================================================ FILE: man/data_small.Rd ================================================ % Generated by roxygen2: do not edit by hand % Please edit documentation in R/example_dataset.R \docType{data} \name{data_small} \alias{data_small} \title{Simulated Small-sample eQTL Data.} \format{ \code{data_small} is a list with the following elements: \describe{ \item{y}{Simulated gene expression response.} \item{X}{Genotype matrix.}} } \description{ A simulated eQTL data set with 47 individuals and 7,430 variables. The response is a simulated gene expression phenotype and the variables are genotypes. 
This data set illustrates the small sample-size setting considered in Denault \emph{et al} (2025). } \examples{ data(data_small) } \references{ W. R. P. Denault \emph{et al} (2025). Accounting for uncertainty in residual variances improves fine-mapping in small sample studies. \emph{bioRxiv} \doi{10.1101/2025.05.16.654543}. } \seealso{ The \dQuote{Small data example} vignette. } \keyword{data} ================================================ FILE: man/diagnose_ash_filter_archived_iter.Rd ================================================ % Generated by roxygen2: do not edit by hand % Please edit documentation in R/diagnosis_reports.R \name{diagnose_ash_filter_archived_iter} \alias{diagnose_ash_filter_archived_iter} \title{V0 archived filter per-iteration diagnostic} \usage{ diagnose_ash_filter_archived_iter( model, Xcorr, masked, b_confident, sentinels, effect_purity, current_case, current_collision, mrash_output ) } \value{ data.frame with one row per slot, all features } \description{ V0 archived filter per-iteration diagnostic } \keyword{internal} ================================================ FILE: man/diagnose_bb_ash_iter.Rd ================================================ % Generated by roxygen2: do not edit by hand % Please edit documentation in R/diagnosis_reports.R \name{diagnose_bb_ash_iter} \alias{diagnose_bb_ash_iter} \title{BB+ash per-iteration diagnostic} \usage{ diagnose_bb_ash_iter( model, Xcorr, mask, b_confident, sentinels, sentinel_collision, is_confident_now, is_trusted, emerging_slots, active_slots, c_hat, ash_result, p, high_chat = NULL, low_chat = NULL, collision_threshold = 0.9, purity_threshold = 0.5, masking_threshold = 0.5, nPIP_threshold = 0.05, c_hat_excess_threshold = 0.2, alpha_entropy_threshold = log(5), slot_prior = NULL, mask_smoothness = NULL, mask_amount = NULL, mask_concentration = NULL, mask_burnin = NULL, mask_spread_pip_at_sent = NULL, mask_pip_prot_at_sent = NULL ) } \value{ data.frame with one row per slot, all features } 
\description{ BB+ash per-iteration diagnostic } \keyword{internal} ================================================ FILE: man/estimate_s_rss.Rd ================================================ % Generated by roxygen2: do not edit by hand % Please edit documentation in R/susie_rss_utils.R \name{estimate_s_rss} \alias{estimate_s_rss} \title{Estimate s in \code{susie_rss} Model Using Regularized LD} \usage{ estimate_s_rss(z, R, n, r_tol = 1e-08, method = "null-mle") } \arguments{ \item{z}{A p-vector of z scores.} \item{R}{A p by p symmetric, positive semidefinite correlation matrix.} \item{n}{The sample size. (Optional, but highly recommended.)} \item{r_tol}{Tolerance level for eigenvalue check of positive semidefinite matrix of R.} \item{method}{A string specifying the method to estimate \eqn{s}.} } \value{ A number between 0 and 1. } \description{ The estimated s gives information about the consistency between the z scores and LD matrix. A larger \eqn{s} means there is a strong inconsistency between z scores and LD matrix. The \dQuote{null-mle} method obtains mle of \eqn{s} under \eqn{z | R ~ N(0,(1-s)R + s I)}, \eqn{0 < s < 1}. The \dQuote{null-partialmle} method obtains mle of \eqn{s} under \eqn{U^T z | R ~ N(0,s I)}, in which \eqn{U} is a matrix containing the eigenvectors that span the null space of R; that is, the eigenvectors corresponding to zero eigenvalues of R. The estimated \eqn{s} from \dQuote{null-partialmle} could be greater than 1. The \dQuote{null-pseudomle} method obtains mle of \eqn{s} under pseudolikelihood \eqn{L(s) = \prod_{j=1}^{p} p(z_j | z_{-j}, s, R)}, \eqn{0 < s < 1}. 
} \examples{ set.seed(1) n <- 500 p <- 1000 beta <- rep(0, p) beta[1:4] <- 0.01 X <- matrix(rnorm(n * p), nrow = n, ncol = p) X <- scale(X, center = TRUE, scale = TRUE) y <- drop(X \%*\% beta + rnorm(n)) input_ss <- compute_suff_stat(X, y, standardize = TRUE) ss <- univariate_regression(X, y) R <- cor(X) attr(R, "eigen") <- eigen(R, symmetric = TRUE) zhat <- with(ss, betahat / sebetahat) # Estimate s using the unadjusted z-scores. s0 <- estimate_s_rss(zhat, R) # Estimate s using the adjusted z-scores. s1 <- estimate_s_rss(zhat, R, n) } ================================================ FILE: man/extract_bb_ash_features.Rd ================================================ % Generated by roxygen2: do not edit by hand % Please edit documentation in R/diagnosis_reports.R \name{extract_bb_ash_features} \alias{extract_bb_ash_features} \title{Extract ML feature table from a completed BB+ash fit} \usage{ extract_bb_ash_features(fit, X, causal = NULL) } \arguments{ \item{fit}{Completed susie fit (with slot_prior + ash)} \item{X}{Design matrix (used to compute Xcorr if needed)} \item{causal}{Integer vector of true causal indices (for labeling)} } \value{ data.frame with one row per slot, all features + TP/FP label } \description{ Computes per-slot features from the converged model. Call with susieR:::extract_bb_ash_features(fit, X_or_Xcorr, causal). } \keyword{internal} ================================================ FILE: man/format_extra_diag.Rd ================================================ % Generated by roxygen2: do not edit by hand % Please edit documentation in R/model_methods.R \name{format_extra_diag} \alias{format_extra_diag} \title{Append class-specific extra-diag columns to the verbose row} \usage{ format_extra_diag(model) } \description{ Default returns an empty string. Subclasses override to inject columns such as `max_pi_null`, `max_KL_l`, alpha-entropy n_eff. Output is appended after the V column in the per-iter tabular line. 
} \keyword{internal} ================================================ FILE: man/format_sigma2_summary.Rd ================================================ % Generated by roxygen2: do not edit by hand % Please edit documentation in R/model_methods.R \name{format_sigma2_summary} \alias{format_sigma2_summary} \title{Format the per-iter sigma2 cell for verbose output} \usage{ format_sigma2_summary(model) } \description{ Default returns the scalar sigma2 in `%.4f`. Subclasses (e.g., mfsusieR's list-of-vectors sigma2; mvsusieR's matrix sigma2) override to a compact summary string of fixed width. } \keyword{internal} ================================================ FILE: man/get.full.posterior.Rd ================================================ % Generated by roxygen2: do not edit by hand % Please edit documentation in R/mr.ash.R \name{get.full.posterior} \alias{get.full.posterior} \title{Approximate Posterior Expectations from Mr.ASH Fit} \usage{ get.full.posterior(fit) } \arguments{ \item{fit}{A Mr.ASH fit obtained, for example, by running \code{mr.ash}.} } \value{ A list object with the following elements: \item{phi}{A p x K matrix containing the posterior assignment probabilities, where p is the number of predictors, and K is the number of mixture components. (Each row of \code{phi} should sum to 1.)} \item{m}{A p x K matrix containing the posterior means conditional on assignment to each mixture component.} \item{s2}{A p x K matrix containing the posterior variances conditional on assignment to each mixture component.} } \description{ Recover the parameters specifying the variational approximation to the posterior distribution of the regression coefficients. To streamline the model fitting implementation, and to reduce memory requirements, \code{\link{mr.ash}} does not store all the parameters needed to specify the approximate posterior. 
} \examples{ ## generate synthetic data set.seed(1) n = 200 p = 300 X = matrix(rnorm(n*p),n,p) beta = double(p) beta[1:10] = 1:10 y = X \%*\% beta + rnorm(n) ## fit mr.ash fit.mr.ash = mr.ash(X, y) ## recover full posterior full.post = get.full.posterior(fit.mr.ash) } ================================================ FILE: man/get_alpha_l.Rd ================================================ % Generated by roxygen2: do not edit by hand % Please edit documentation in R/model_methods.R \name{get_alpha_l} \alias{get_alpha_l} \title{Get posterior inclusion probabilities for effect l} \usage{ get_alpha_l(model, l) } \description{ Get posterior inclusion probabilities for effect l } \keyword{internal} ================================================ FILE: man/get_cs_correlation.Rd ================================================ % Generated by roxygen2: do not edit by hand % Please edit documentation in R/susie_get_functions.R \name{get_cs_correlation} \alias{get_cs_correlation} \title{Get Correlations Between CSs, using Variable with Maximum PIP From Each CS} \usage{ get_cs_correlation(model, X = NULL, Xcorr = NULL, max = FALSE) } \arguments{ \item{model}{A SuSiE fit, typically an output from \code{\link{susie}} or one of its variants.} \item{X}{n by p matrix of values of the p variables (covariates) in n samples. When provided, correlation between variables will be computed and used to remove CSs whose minimum correlation among variables is smaller than \code{min_abs_corr}.} \item{Xcorr}{p by p matrix of correlations between variables (covariates). When provided, it will be used to remove CSs whose minimum correlation among variables is smaller than \code{min_abs_corr}.} \item{max}{When \code{max = FALSE}, return a matrix of CS correlations. When \code{max = TRUE}, return only the maximum absolute correlation among all pairs of correlations.} } \value{ A matrix of correlations between CSs, or the maximum absolute correlation when \code{max = TRUE}. 
} \description{ This function evaluates the correlation between single effect CSs. It is not part of the SuSiE inference. Rather, it is designed as a diagnostic tool to assess how correlated the reported CS are. } ================================================ FILE: man/get_objective.Rd ================================================ % Generated by roxygen2: do not edit by hand % Please edit documentation in R/model_methods.R \name{get_objective} \alias{get_objective} \title{Compute the SuSiE ELBO (evidence lower bound)} \usage{ get_objective(data, params, model) } \arguments{ \item{data}{Data object.} \item{params}{Params object.} \item{model}{Model object.} } \value{ Scalar ELBO value. } \description{ Building-block function used by downstream packages implementing custom IBSS loops. } \keyword{internal} ================================================ FILE: man/get_posterior_mean_l.Rd ================================================ % Generated by roxygen2: do not edit by hand % Please edit documentation in R/model_methods.R \name{get_posterior_mean_l} \alias{get_posterior_mean_l} \title{Get PIP-weighted posterior mean for effect l (alpha * mu)} \usage{ get_posterior_mean_l(model, l) } \description{ Get PIP-weighted posterior mean for effect l (alpha * mu) } \keyword{internal} ================================================ FILE: man/get_posterior_mean_sum.Rd ================================================ % Generated by roxygen2: do not edit by hand % Please edit documentation in R/model_methods.R \name{get_posterior_mean_sum} \alias{get_posterior_mean_sum} \title{Get sum of PIP-weighted posterior means across all effects} \usage{ get_posterior_mean_sum(model) } \description{ Get sum of PIP-weighted posterior means across all effects } \keyword{internal} ================================================ FILE: man/get_posterior_moments_l.Rd ================================================ % Generated by roxygen2: do not edit by hand % Please edit 
documentation in R/model_methods.R \name{get_posterior_moments_l} \alias{get_posterior_moments_l} \title{Get posterior moments for effect l (for EM prior variance update)} \usage{ get_posterior_moments_l(model, l) } \description{ Get posterior moments for effect l (for EM prior variance update) } \keyword{internal} ================================================ FILE: man/get_prior_variance_l.Rd ================================================ % Generated by roxygen2: do not edit by hand % Please edit documentation in R/model_methods.R \name{get_prior_variance_l} \alias{get_prior_variance_l} \title{Get prior variance for effect l} \usage{ get_prior_variance_l(model, l) } \description{ Get prior variance for effect l } \keyword{internal} ================================================ FILE: man/get_slot_weight.Rd ================================================ % Generated by roxygen2: do not edit by hand % Please edit documentation in R/generic_methods.R \name{get_slot_weight} \alias{get_slot_weight} \title{Get the slot weight for effect l} \usage{ get_slot_weight(model, l) } \arguments{ \item{model}{SuSiE model object.} \item{l}{Effect index.} } \value{ Scalar weight (default 1). } \description{ Returns the weight by which effect l's contribution to the fitted values is scaled. When \code{model$slot_weights} is NULL (the default), all effects have weight 1 and standard SuSiE behavior is recovered. } \details{ Slot weights enable a natural mechanism for adaptively estimating the number of effects: each slot l can have a weight in [0,1] reflecting the posterior probability that the slot is active. With a suitable prior on the number of active effects, this generalizes SuSiE's fixed L to a data-driven estimate. 
} \keyword{internal} ================================================ FILE: man/ibss_finalize.Rd ================================================ % Generated by roxygen2: do not edit by hand % Please edit documentation in R/iterative_bayesian_stepwise_selection.R \name{ibss_finalize} \alias{ibss_finalize} \title{Finalize IBSS model} \usage{ ibss_finalize( data, params, model, elbo = NULL, iter = NA_integer_, tracking = NULL ) } \arguments{ \item{data}{Data object (individual, ss, or rss_lambda)} \item{params}{Validated params object} \item{model}{Converged model object} \item{elbo}{ELBO values (optional)} \item{iter}{Number of iterations completed} \item{tracking}{Tracking data (optional)} } \value{ Finalized model object with credible sets and PIPs. } \description{ Computes credible sets, PIPs, z-scores, and cleans up temporary fields from the model object. } \keyword{internal} ================================================ FILE: man/ibss_initialize.Rd ================================================ % Generated by roxygen2: do not edit by hand % Please edit documentation in R/iterative_bayesian_stepwise_selection.R \name{ibss_initialize} \alias{ibss_initialize} \alias{ibss_initialize.default} \title{Initialize IBSS model} \usage{ ibss_initialize(data, params) \method{ibss_initialize}{default}(data, params) } \arguments{ \item{data}{Data object (individual, ss, or rss_lambda)} \item{params}{Validated params object} } \value{ Initialized model object ready for the IBSS iteration loop. } \description{ Creates and initializes the model object for the IBSS algorithm. 
} \keyword{internal} ================================================ FILE: man/is_symmetric_matrix.Rd ================================================ % Generated by roxygen2: do not edit by hand % Please edit documentation in R/susie_utils.R \name{is_symmetric_matrix} \alias{is_symmetric_matrix} \title{Check for symmetric matrix} \usage{ is_symmetric_matrix(x) } \arguments{ \item{x}{A matrix to check} } \value{ Logical indicating if x is symmetric } \description{ Check for symmetric matrix } \keyword{internal} ================================================ FILE: man/kriging_rss.Rd ================================================ % Generated by roxygen2: do not edit by hand % Please edit documentation in R/susie_rss_utils.R \name{kriging_rss} \alias{kriging_rss} \title{Compute Distribution of z-scores of Variant j Given Other z-scores, and Detect Possible Allele Switch Issue} \usage{ kriging_rss( z, R, n, r_tol = 1e-08, s = estimate_s_rss(z, R, n, r_tol, method = "null-mle") ) } \arguments{ \item{z}{A p-vector of z scores.} \item{R}{A p by p symmetric, positive semidefinite correlation matrix.} \item{n}{The sample size. (Optional, but highly recommended.)} \item{r_tol}{Tolerance level for eigenvalue check of positive semidefinite matrix of R.} \item{s}{an estimated s from \code{estimate_s_rss}} } \value{ a list containing a ggplot2 plot object and a table. The plot compares observed z score vs the expected value. The possible allele switched variants are labeled as red points (log LR > 2 and abs(z) > 2). The table summarizes the conditional distribution for each variant and the likelihood ratio test. The table has the following columns: the observed z scores, the conditional expectation, the conditional variance, the standardized differences between the observed z score and expected value, the log likelihood ratio statistics. } \description{ Under the null, the rss model with regularized LD matrix is \eqn{z|R,s ~ N(0, (1-s)R + s I))}. 
We use a mixture of normals to model the conditional distribution of z_j given other z scores, \eqn{z_j | z_{-j}, R, s ~ \sum_{k=1}^{K} \pi_k N(-\Omega_{j,-j} z_{-j}/\Omega_{jj}, \sigma_{k}^2/\Omega_{jj})}, \eqn{\Omega = ((1-s)R + sI)^{-1}}, \eqn{\sigma_1, ..., \sigma_K} is a grid of fixed positive numbers. We estimate the mixture weights \eqn{\pi}. We detect the possible allele switch issue using a likelihood ratio for each variant. } \examples{ # See also the vignette, "Diagnostic for fine-mapping with summary # statistics." set.seed(1) n <- 500 p <- 1000 beta <- rep(0, p) beta[1:4] <- 0.01 X <- matrix(rnorm(n * p), nrow = n, ncol = p) X <- scale(X, center = TRUE, scale = TRUE) y <- drop(X \%*\% beta + rnorm(n)) ss <- univariate_regression(X, y) R <- cor(X) attr(R, "eigen") <- eigen(R, symmetric = TRUE) zhat <- with(ss, betahat / sebetahat) cond_dist <- kriging_rss(zhat, R, n = n) cond_dist$plot } ================================================ FILE: man/label_diag_truth.Rd ================================================ % Generated by roxygen2: do not edit by hand % Please edit documentation in R/diagnosis_reports.R \name{label_diag_truth} \alias{label_diag_truth} \title{Label diagnostic table with ground truth TP/FP} \usage{ label_diag_truth(df, fit, causal) } \arguments{ \item{df}{Diagnostic data.frame (from collect_ash_diag or single iter)} \item{fit}{SuSiE fit object} \item{causal}{Integer vector of causal variant indices} } \value{ df with added 'cs_label' column: "TP", "FP", or "-" (no CS) } \description{ For each slot at the final iteration, check if its CS (if any) contains a causal variant. 
} \keyword{internal} ================================================ FILE: man/loglik_mixture_common.Rd ================================================ % Generated by roxygen2: do not edit by hand % Please edit documentation in R/mixture_prior.R \name{loglik_mixture_common} \alias{loglik_mixture_common} \title{Compute mixture log-Bayes factors and posterior inclusion probabilities} \usage{ loglik_mixture_common(params, model, ser_stats, l) } \arguments{ \item{params}{Params object with prior_variance_grid (K-vector) and mixture_weights (K-vector summing to 1)} \item{model}{Current model object with pi (prior weights)} \item{ser_stats}{List with betahat (p-vector) and shat2 (p-vector)} \item{l}{Effect index} } \value{ Updated model with alpha[l,], lbf[l], lbf_variable[l,], lbf_grid[[l]] } \description{ For each grid point k and variant j, computes the Wakefield approximate Bayes factor (ABF), then forms the mixture BF as a weighted sum over grid points. Stores the full p x K log-BF matrix in model$lbf_grid[[l]] for downstream use (e.g., mixsqp M-step in susieAnn). } \keyword{internal} ================================================ FILE: man/mr.ash.Rd ================================================ % Generated by roxygen2: do not edit by hand % Please edit documentation in R/mr.ash.R \name{mr.ash} \alias{mr.ash} \title{Multiple Regression with Adaptive Shrinkage} \usage{ mr.ash( X, y, Z = NULL, sa2 = NULL, method_q = c("sigma_dep_q", "sigma_indep_q"), method_g = c("caisa", "accelerate", "block"), max.iter = 1000, min.iter = 1, beta.init = NULL, update.pi = TRUE, pi = NULL, update.sigma2 = TRUE, sigma2 = NULL, update.order = NULL, standardize = FALSE, intercept = TRUE, tol = set_default_tolerance(), verbose = TRUE ) } \arguments{ \item{X}{The input matrix, of dimension (n,p); each column is a single predictor; and each row is an observation vector. Here, n is the number of samples and p is the number of predictors. 
The matrix cannot be sparse.} \item{y}{The observed continuously-valued responses, a vector of length n.} \item{Z}{The covariate matrix, of dimension (n,k), where k is the number of covariates. This feature is not yet implemented; \code{Z} must be set to \code{NULL}.} \item{sa2}{The vector of prior mixture component variances. The variances should be in increasing order, starting at zero; that is, \code{sort(sa2)} should be the same as \code{sa2}. When \code{sa2} is \code{NULL}, the default setting is used, \code{sa2[k] = (2^(0.05*(k-1)) - 1)^2}, for \code{k = 1:20}. For this default setting, \code{sa2[1] = 0}, and \code{sa2[20]} is roughly 1.} \item{method_q}{The algorithm used to update the variational approximation to the posterior distribution of the regression coefficients; \code{method = "sigma_dep_q"} and \code{method = "sigma_indep_q"} take different approaches to updating the residual variance \eqn{\sigma^2}.} \item{method_g}{\code{method = "caisa"}, an abbreviation of "Coordinate Ascent Iterative Shrinkage Algorithm", fits the model by approximate EM; it iteratively updates the variational approximation to the posterior distribution of the regression coefficients (the approximate E-step) and the model parameters (mixture weights and residual covariance) in an approximate M-step. Settings \code{method = "block"} and \code{method = "accelerate"} are considered experimental.} \item{max.iter}{The maximum number of outer loop iterations allowed.} \item{min.iter}{The minimum number of outer loop iterations allowed.} \item{beta.init}{The initial estimate of the (approximate) posterior mean regression coefficients. This should be \code{NULL}, or a vector of length p. When \code{beta.init} is \code{NULL}, the posterior mean coefficients are all initially set to zero.} \item{update.pi}{If \code{update.pi = TRUE}, the mixture proportions in the mixture-of-normals prior are estimated from the data. 
In the manuscript, \code{update.pi = TRUE}.} \item{pi}{The initial estimate of the mixture proportions \eqn{\pi_1, \ldots, \pi_K}. If \code{pi} is \code{NULL}, the mixture weights are initialized to \code{rep(1/K,K)}, where \code{K = length(sa2)}.} \item{update.sigma2}{If \code{update.sigma2 = TRUE}, the residual variance \eqn{\sigma^2} is estimated from the data. In the manuscript, \code{update.sigma2 = TRUE}.} \item{sigma2}{The initial estimate of the residual variance, \eqn{\sigma^2}. If \code{sigma2 = NULL}, the residual variance is initialized to the empirical variance of the residuals based on the initial estimates of the regression coefficients, \code{beta.init}, after removing linear effects of the intercept and any covariates.} \item{update.order}{The order in which the co-ordinate ascent updates for estimating the posterior mean coefficients are performed. \code{update.order} can be \code{NULL}, \code{"random"}, or any permutation of \eqn{(1,\ldots,p)}, where \code{p} is the number of columns in the input matrix \code{X}. When \code{update.order} is \code{NULL}, the co-ordinate ascent updates are performed in the order in which they appear in \code{X}; this is equivalent to setting \code{update.order = 1:p}. When \code{update.order = "random"}, the co-ordinate ascent updates are performed in a randomly generated order, and this random ordering is different at each outer-loop iteration.} \item{standardize}{The logical flag for standardization of the columns of \code{X}, prior to the model fitting. The coefficients are always returned on the original scale.} \item{intercept}{When \code{intercept = TRUE}, an intercept is included in the regression model.} \item{tol}{Additional settings controlling behaviour of the model fitting algorithm. \code{tol$convtol} controls the termination criterion for the model fitting. 
The outer-loop updates stop when the relative L2 change in the estimates of the posterior mean coefficients is less than \code{convtol}, i.e., \code{||beta_new - beta_old||_2 / max(1, ||beta_old||_2) < convtol}. \code{tol$epstol} is a small, positive number added to the likelihoods to avoid logarithms of zero.} \item{verbose}{If \code{verbose = TRUE}, some information about the status of the model fitting is printed to the console.} } \value{ A list object with the following elements: \item{intercept}{The estimated intercept.} \item{beta}{A vector containing posterior mean estimates of the regression coefficients for all predictors.} \item{sigma2}{The estimated residual variance.} \item{pi}{A vector containing the estimated mixture proportions.} \item{iter}{The number of outer-loop iterations that were performed.} \item{update.order}{The ordering used for performing the coordinate-wise updates. For \code{update.order = "random"}, the orderings for outer-loop iterations are provided in a vector of length \code{p*max.iter}, where \code{p} is the number of predictors.} \item{varobj}{A vector of length \code{numiter}, containing the value of the variational objective (equal to the negative "evidence lower bound") attained at each (outer-loop) model fitting iteration. Note that the objective does not account for the intercept term, even when \code{intercept = TRUE}; therefore, this value should be interpreted as being an approximation to the marginal likelihood \emph{conditional} on the estimate of the intercept.} \item{data}{The preprocessed data (X, Z, y) provided as input to the model fitting algorithm. \code{data$w} is equal to \code{diag(crossprod(X))}, in which \code{X} is the preprocessed data matrix. Additionally, \code{data$sa2} gives the prior variances used.} } \description{ Model fitting algorithms for Multiple Regression with Adaptive Shrinkage ("Mr.ASH"). Mr.ASH is a variational empirical Bayes (VEB) method for multiple linear regression. 
The fitting algorithms (locally) maximize the approximate marginal likelihood (the "evidence lower bound", or ELBO) via coordinate-wise updates. } \details{ Mr.ASH is a statistical inference method for the following multiple linear regression model: \deqn{y | X, \beta, \sigma^2 ~ N(X \beta, \sigma^2 I_n),} in which the regression coefficients \eqn{\beta} admit a mixture-of-normals prior, \deqn{\beta | \pi, \sigma ~ g = \sum_{k=1}^K N(0, \sigma^2 \sigma_k^2).} Each mixture component in the prior, \eqn{g}, is a normal density centered at zero, with variance \eqn{\sigma^2 \sigma_k^2}. The fitting algorithm, if run for a large enough number of iterations, will find an approximate posterior for the regression coefficients, denoted by \eqn{q(\beta)}, residual variance parameter \eqn{\sigma^2}, and prior mixture weights \eqn{\pi_1, \ldots, \pi_K} maximizing the evidence lower bound, \deqn{F(q, \pi, \sigma^2) = E_q \log p(y | X, \beta, \sigma^2) - \sum_{j=1}^p D_{KL}(q_j || g),} where \eqn{D_{KL}(q_j || g)} denotes the Kullback-Leibler (KL) divergence, a measure of the "distance" between (approximate) posterior \eqn{q_j(\beta_j)} and prior \eqn{g(\beta_j)}. The fitting algorithm iteratively updates the approximate posteriors \eqn{q_1, \ldots, q_p}, separately for each \eqn{j = 1, \ldots, p} (in an order determined by \code{update.order}), then separately updates the mixture weights \eqn{\pi} and residual variance \eqn{\sigma^2}. This coordinate-wise update scheme iterates until the convergence criterion is met, or until the algorithm hits an upper bound on the number of iterations (specified by \code{max.iter}). Coordinate-wise optimization algorithms for model fitting are implemented in C++ for efficient handling of large-scale data. See \sQuote{References} for more details about the model and algorithm. 
} \examples{ ### generate synthetic data set.seed(1) n = 200 p = 300 X = matrix(rnorm(n*p),n,p) beta = double(p) beta[1:10] = 1:10 y = X \%*\% beta + rnorm(n) ### fit Mr.ASH fit.mr.ash = mr.ash(X,y, method_q = "sigma_indep_q") #' fit.mr.ash = mr.ash(X,y, method_q = "sigma_dep_q") ### prediction routine Xnew = matrix(rnorm(n*p),n,p) ynew = Xnew \%*\% beta + rnorm(n) ypred = predict(fit.mr.ash, Xnew) ### test error rmse = norm(ynew - ypred, '2') / sqrt(n) ### coefficients betahat = predict(fit.mr.ash, type = "coefficients") # this equals c(fit.mr.ash$intercept, fit.mr.ash$beta) } \references{ Y. Kim (2020), Bayesian shrinkage methods for high dimensional regression. Ph.D. thesis, University of Chicago. } \seealso{ \code{\link{get.full.posterior}}, \code{\link{predict.mr.ash}} } ================================================ FILE: man/mr.ash.rss.Rd ================================================ % Generated by roxygen2: do not edit by hand % Please edit documentation in R/mr.ash.rss.R \name{mr.ash.rss} \alias{mr.ash.rss} \title{Bayesian Multiple Regression with Mixture-of-Normals Prior (RSS)} \usage{ mr.ash.rss( bhat, shat, R, var_y, n, s0, w0, sigma2_e = NULL, mu1_init = numeric(0), tol = 1e-08, max_iter = 1e+05, z = numeric(0), update_w0 = TRUE, update_sigma = TRUE, compute_ELBO = TRUE, standardize = FALSE ) } \arguments{ \item{bhat}{Numeric vector of observed effect sizes (standardized).} \item{shat}{Numeric vector of standard errors of effect sizes.} \item{R}{Numeric matrix of the correlation matrix.} \item{var_y}{Numeric value of the variance of the outcome. If NULL, it is set to Inf (effects on standardized scale).} \item{n}{Integer value of the sample size.} \item{s0}{Numeric vector of prior variances for the mixture components.} \item{w0}{Numeric vector of prior weights for the mixture components.} \item{sigma2_e}{Numeric value of the initial error variance estimate. 
If \code{NULL} (default), initialized to \code{var_y} (matching \code{mr.ash} behavior of using residual variance with zero initialization), or 1 when \code{var_y = Inf}.} \item{mu1_init}{Numeric vector of initial values for the posterior mean of the coefficients. Default is \code{numeric(0)} (initialize to zero).} \item{tol}{Numeric value of the convergence tolerance. Default is 1e-8.} \item{max_iter}{Integer value of the maximum number of iterations. Default is 1e5.} \item{z}{Numeric vector of Z-scores. If not provided, computed as \code{bhat / shat}.} \item{update_w0}{Logical value indicating whether to update the mixture weights. Default is TRUE.} \item{update_sigma}{Logical value indicating whether to update the error variance. Default is TRUE.} \item{compute_ELBO}{Logical value indicating whether to compute the Evidence Lower Bound (ELBO). Default is TRUE.} \item{standardize}{Logical value indicating whether to standardize the input data. Default is FALSE.} } \value{ A list containing the following components: \describe{ \item{beta}{Numeric vector of posterior mean coefficients (same as mu1).} \item{sigma2}{Numeric value of the residual variance (same as sigma2_e).} \item{pi}{Numeric vector of mixture weights (same as w0).} \item{iter}{Integer, number of iterations performed.} \item{varobj}{Numeric vector of ELBO values per iteration.} \item{mu1}{Numeric vector of the posterior mean of the coefficients.} \item{sigma2_1}{Numeric vector of the posterior variance of the coefficients.} \item{w1}{Numeric matrix of the posterior assignment probabilities.} \item{sigma2_e}{Numeric value of the error variance.} \item{w0}{Numeric vector of the mixture weights.} \item{ELBO}{Numeric value of the Evidence Lower Bound (if \code{compute_ELBO = TRUE}).} } } \description{ This function performs Bayesian multiple regression with a mixture-of-normals prior using summary statistics (RSS: Regression with Summary Statistics). It uses a C++ implementation for efficient computation. 
} \examples{ # Generate example data set.seed(985115) n <- 350 p <- 16 sigmasq_error <- 0.5 zeroes <- rbinom(p, 1, 0.6) beta.true <- rnorm(p, 1, sd = 4) beta.true[zeroes] <- 0 X <- cbind(matrix(rnorm(n * p), nrow = n)) X <- scale(X, center = TRUE, scale = FALSE) y <- X \%*\% matrix(beta.true, ncol = 1) + rnorm(n, 0, sqrt(sigmasq_error)) y <- scale(y, center = TRUE, scale = FALSE) # Set the prior K <- 9 sigma0 <- c(0.001, .1, .5, 1, 5, 10, 20, 30, .005) omega0 <- rep(1 / K, K) # Calculate summary statistics b.hat <- sapply(1:p, function(j) { summary(lm(y ~ X[, j]))$coefficients[-1, 1] }) s.hat <- sapply(1:p, function(j) { summary(lm(y ~ X[, j]))$coefficients[-1, 2] }) R.hat <- cor(X) var_y <- var(y) sigmasq_init <- 1.5 # Run mr.ash.rss out <- mr.ash.rss(b.hat, s.hat, R = R.hat, var_y = var_y, n = n, sigma2_e = sigmasq_init, s0 = sigma0, w0 = omega0, mu1_init = rep(0, ncol(X)), tol = 1e-8, max_iter = 1e5, update_w0 = TRUE, update_sigma = TRUE, compute_ELBO = TRUE, standardize = FALSE ) } ================================================ FILE: man/path.order.Rd ================================================ % Generated by roxygen2: do not edit by hand % Please edit documentation in R/univariate_regression.R \name{path.order} \alias{path.order} \title{Ordering of Predictors by Regularization Path} \usage{ path.order(fit) } \arguments{ \item{fit}{A fit object whose \code{coef()} method returns a matrix of coefficients with the intercept in the first row and one column per penalty strength (as produced by typical penalized-regression implementations).} } \value{ An ordering of the predictors. } \description{ This function determines an ordering of the predictors based on the regularization path of the penalized regression; in particular, the predictors are ordered based on the order in which the coefficients are included in the model as the penalty strength decreases. 
} \examples{ ### generate synthetic data set.seed(1) n = 200 p = 30 X = matrix(rnorm(n*p),n,p) beta = double(p) beta[1:10] = 1:10 y = X \%*\% beta + rnorm(n) ### build a minimal example 'fit' object with the same structure as a ### fit from a penalized regression: a coefficient matrix with the ### intercept in row 1 and one column per (decreasing) penalty value. beta_path = matrix(0, p + 1, p) for (k in 1:p) beta_path[k + 1, k:p] = 1 fit = list(coefficients = beta_path) order = path.order(fit) } ================================================ FILE: man/post_loglik_prior_hook.Rd ================================================ % Generated by roxygen2: do not edit by hand % Please edit documentation in R/single_effect_regression.R \name{post_loglik_prior_hook} \alias{post_loglik_prior_hook} \title{Post-loglik prior-update hook} \usage{ post_loglik_prior_hook(data, params, model, ser_stats, l, V_init) } \description{ S3 generic, called after `loglik` / posterior moments / KL. Default routes to `optimize_prior_variance` for `EM`. Returns `list(V, model)`. } \keyword{internal} ================================================ FILE: man/pre_loglik_prior_hook.Rd ================================================ % Generated by roxygen2: do not edit by hand % Please edit documentation in R/single_effect_regression.R \name{pre_loglik_prior_hook} \alias{pre_loglik_prior_hook} \title{Pre-loglik prior-update hook} \usage{ pre_loglik_prior_hook(data, params, model, ser_stats, l, V_init) } \description{ S3 generic, called between SER stats and `loglik`. Default routes to `optimize_prior_variance` for `optim` / `uniroot` / `simple`. Returns `list(V, model)`. 
} \keyword{internal} ================================================ FILE: man/predict.mr.ash.Rd ================================================ % Generated by roxygen2: do not edit by hand % Please edit documentation in R/mr.ash.R \name{predict.mr.ash} \alias{predict.mr.ash} \title{Predict Outcomes or Extract Coefficients from Mr.ASH Fit} \usage{ \method{predict}{mr.ash}(object, newx = NULL, type = c("response", "coefficients"), ...) } \arguments{ \item{object}{A mr_ash fit, usually the result of calling \code{mr.ash}.} \item{newx}{The input matrix, of dimension (n,p); each column is a single predictor; and each row is an observation vector. Here, n is the number of samples and p is the number of predictors. When \code{newx} is \code{NULL}, the fitted values for the training data are provided.} \item{type}{The type of output. For \code{type = "response"}, predicted or fitted outcomes are returned; for \code{type = "coefficients"}, the estimated coefficients are returned.} \item{...}{Additional arguments passed to the default S3 method.} } \value{ For \code{type = "response"}, predicted or fitted outcomes are returned; for \code{type = "coefficients"}, the estimated coefficients are returned. } \description{ This function predicts outcomes (y) given the observed variables (X) and a Mr.ASH model; alternatively, retrieve the estimates of the regression coefficients. 
} \examples{ ## generate synthetic data set.seed(1) n = 200 p = 300 X = matrix(rnorm(n*p),n,p) beta = double(p) beta[1:10] = 1:10 y = X \%*\% beta + rnorm(n) ## fit mr.ash fit.mr.ash = mr.ash(X, y) ## predict Xnew = matrix(rnorm(n*p),n,p) ypred = predict(fit.mr.ash, Xnew) } ================================================ FILE: man/predict.susie.Rd ================================================ % Generated by roxygen2: do not edit by hand % Please edit documentation in R/predict.susie.R \name{predict.susie} \alias{predict.susie} \title{Predict outcomes or extract coefficients from susie fit.} \usage{ \method{predict}{susie}(object, newx = NULL, type = c("response", "coefficients"), ...) } \arguments{ \item{object}{A susie fit.} \item{newx}{A new value for X at which to do predictions.} \item{type}{The type of output. For \code{type = "response"}, predicted or fitted outcomes are returned; for \code{type = "coefficients"}, the estimated coefficients are returned.} \item{\dots}{Other arguments used by generic predict function. These extra arguments are not used here.} } \value{ For \code{type = "response"}, predicted or fitted outcomes are returned; for \code{type = "coefficients"}, the estimated coefficients are returned. If the susie fit has intercept = \code{NA} (which is common when using \code{susie_ss}) then predictions are computed using an intercept of 0, and a warning is emitted. } \description{ Predict outcomes or extract coefficients from susie fit. 
} ================================================ FILE: man/print.summary.susie_post_outcome_configuration.Rd ================================================ % Generated by roxygen2: do not edit by hand % Please edit documentation in R/susie_post_outcome_configuration.R \name{print.summary.susie_post_outcome_configuration} \alias{print.summary.susie_post_outcome_configuration} \title{Print a summary.susie_post_outcome_configuration object} \usage{ \method{print}{summary.susie_post_outcome_configuration}(x, ...) } \arguments{ \item{x}{Output of [summary.susie_post_outcome_configuration()].} \item{...}{Ignored.} } \value{ The input invisibly. } \description{ Pretty-prints the tidy tables built by [summary.susie_post_outcome_configuration()] with optional ANSI color highlighting. See that page for the color encoding. } \seealso{ [summary.susie_post_outcome_configuration()] } ================================================ FILE: man/resolve_mixture_prior.Rd ================================================ % Generated by roxygen2: do not edit by hand % Please edit documentation in R/mixture_prior.R \name{resolve_mixture_prior} \alias{resolve_mixture_prior} \title{Resolve fixed mixture prior parameters} \usage{ resolve_mixture_prior( estimate_prior_method, estimate_prior_variance, prior_variance_grid, mixture_weights ) } \description{ Called from susie, susie_ss, and susie_rss to handle the prior_variance_grid / mixture_weights parameters. When prior_variance_grid is non-NULL, overrides estimate_prior_method to "fixed_mixture" and validates inputs. Returns a list with the resolved estimate_prior_method, estimate_prior_variance, prior_variance_grid, and mixture_weights. 
} \keyword{internal} ================================================ FILE: man/safe_cor.Rd ================================================ % Generated by roxygen2: do not edit by hand % Please edit documentation in R/susie_utils.R \name{safe_cor} \alias{safe_cor} \title{Computes correlation matrix from data matrix Handles constant columns without warnings - returns 0 correlation for constant cols Uses Rfast::cora when available (much faster for large matrices), falls back to crossprod-based computation otherwise.} \usage{ safe_cor(X) } \arguments{ \item{X}{Data matrix (n x p)} } \value{ Correlation matrix (p x p) } \description{ Computes correlation matrix from data matrix Handles constant columns without warnings - returns 0 correlation for constant cols Uses Rfast::cora when available (much faster for large matrices), falls back to crossprod-based computation otherwise. } \keyword{internal} ================================================ FILE: man/safe_cov2cor.Rd ================================================ % Generated by roxygen2: do not edit by hand % Please edit documentation in R/susie_utils.R \name{safe_cov2cor} \alias{safe_cov2cor} \title{Converts covariance matrix to correlation matrix Constant variables (zero variance) get correlation 0 with others, 1 with self} \usage{ safe_cov2cor(V) } \arguments{ \item{V}{Covariance matrix} } \value{ Correlation matrix } \description{ Converts covariance matrix to correlation matrix Constant variables (zero variance) get correlation 0 with others, 1 with self } \keyword{internal} ================================================ FILE: man/scale_design_matrix.Rd ================================================ % Generated by roxygen2: do not edit by hand % Please edit documentation in R/susie_utils.R \name{scale_design_matrix} \alias{scale_design_matrix} \title{Scale design matrix using centering and scaling parameters} \usage{ scale_design_matrix(X, center = NULL, scale = NULL) } \arguments{ \item{X}{Matrix to 
scale (n x p)} \item{center}{Vector of column means to subtract (length p), or NULL} \item{scale}{Vector of column SDs to divide by (length p), or NULL} } \value{ Scaled matrix with centered and scaled columns } \description{ Applies column-wise centering and scaling to match the space used by compute_XtX() and compute_Xty() for unmappable effects methods. } \keyword{internal} ================================================ FILE: man/set_prior_variance_l.Rd ================================================ % Generated by roxygen2: do not edit by hand % Please edit documentation in R/model_methods.R \name{set_prior_variance_l} \alias{set_prior_variance_l} \title{Set prior variance for effect l} \usage{ set_prior_variance_l(model, l, V) } \description{ Set prior variance for effect l } \keyword{internal} ================================================ FILE: man/slot_prior_betabinom.Rd ================================================ % Generated by roxygen2: do not edit by hand % Please edit documentation in R/slot_prior.R \name{slot_prior_betabinom} \alias{slot_prior_betabinom} \alias{slot_prior_poisson} \title{Slot Activity Prior for SuSiE} \usage{ slot_prior_betabinom( a_beta = NULL, b_beta = NULL, c_hat_init = NULL, skip_threshold_multiplier = 0 ) slot_prior_poisson( C, nu = NULL, update_schedule = c("sequential", "batch"), c_hat_init = NULL, skip_threshold_multiplier = 0 ) } \arguments{ \item{a_beta}{Shape parameter for the Beta prior on inclusion probability rho. Default 1.} \item{b_beta}{Shape parameter for the Beta prior on inclusion probability rho. Default 2, giving a moderate sparsity preference with \code{E[rho] = 1/3 ~ 0.33}. Setting \code{a_beta = 1} and \code{b_beta = 1} gives a uniform prior on [0,1], providing automatic multiplicity correction following Scott and Berger (2010).} \item{c_hat_init}{Optional numeric L-vector of initial slot activity probabilities for warm-starting. 
If NULL, initialized at the prior mean.} \item{skip_threshold_multiplier}{Multiplier for the adaptive skip threshold. Slots with c_hat below this fraction of the baseline (prior with zero signal) are skipped. Default 0 (no skipping). The threshold is recomputed after each sweep from the current model state, and is set to 0 on the first sweep so all slots are evaluated at least once.} \item{C}{Expected number of causal variants for the Gamma-Poisson prior on the per-block causal rate. Must be positive. Not used by \code{slot_prior_betabinom}.} \item{nu}{Overdispersion parameter for the Gamma-Poisson prior on the per-block causal rate. Not used by \code{slot_prior_betabinom}. Larger values give stronger shrinkage toward C. Default 8 when not specified.} \item{update_schedule}{How the Gamma shape parameter is updated during IBSS iterations (Gamma-Poisson only; ignored for Beta-Binomial which is inherently sequential). \code{"batch"} updates once per full sweep (standard CAVI). \code{"sequential"} updates after each slot (faster convergence per iteration, used by susieAnn).} } \value{ A list of class \code{"slot_prior"} with the appropriate subclass. } \description{ Construct a prior specification for the slot activity model, which regularizes the number of active single effects in SuSiE. Two prior families are available: Beta-Binomial (default, recommended for single-locus) and Gamma-Poisson (recommended for genome-wide applications via susieAnn). } \details{ Two prior types are available: \describe{ \item{\code{slot_prior_betabinom}}{Uses a Beta-Binomial model for slot inclusion. The inclusion probability rho is given a Beta(a_beta, b_beta) prior and integrated out analytically, yielding an adaptive multiplicity correction that penalizes less when more slots are active. This is the recommended default for single-locus applications. 
See Scott and Berger (2010) for the theoretical justification.} \item{\code{slot_prior_poisson}}{Uses the Gamma-Poisson model with Poisson approximation for slot indicators. Recommended for genome-wide applications via susieAnn, where C and nu are estimated across loci.} } } \examples{ # Default: Beta-Binomial with Beta(1, 2) prior on inclusion probability slot_prior_betabinom() # Gamma-Poisson for susieAnn slot_prior_poisson(C = 5, nu = 8) # Pass to susie # fit <- susie(X, y, slot_prior = slot_prior_betabinom()) } \references{ Scott, J. G. and Berger, J. O. (2010). Bayes and empirical-Bayes multiplicity adjustment in the variable-selection problem. \emph{Annals of Statistics}, 38(5), 2587--2619. } ================================================ FILE: man/summary.susie.Rd ================================================ % Generated by roxygen2: do not edit by hand % Please edit documentation in R/summary.susie.R \name{summary.susie} \alias{summary.susie} \alias{print.summary.susie} \title{Summarize Susie Fit.} \usage{ \method{summary}{susie}(object, ...) \method{print}{summary.susie}(x, ...) } \arguments{ \item{object}{A susie fit.} \item{\dots}{Additional arguments passed to the generic \code{summary} or \code{print.summary} method.} \item{x}{A susie summary.} } \value{ \code{summary.susie} returns a list containing a data frame of variables and a data frame of credible sets. } \description{ \code{summary} method for the \dQuote{susie} class. 
} ================================================ FILE: man/summary.susie_post_outcome_configuration.Rd ================================================ % Generated by roxygen2: do not edit by hand % Please edit documentation in R/susie_post_outcome_configuration.R \name{summary.susie_post_outcome_configuration} \alias{summary.susie_post_outcome_configuration} \title{Summarise a susie_post_outcome_configuration result} \usage{ \method{summary}{susie_post_outcome_configuration}( object, prob_thresh = 0.8, ambiguous_lower = 0.5, signal_only = TRUE, color = "auto", ... ) } \arguments{ \item{object}{Output of [susie_post_outcome_configuration()].} \item{prob_thresh}{Threshold above which `marginal_prob` counts as a signal (default `0.8`).} \item{ambiguous_lower}{Lower edge of the "ambiguous" band for the SuSiEx color coding: marginals in `[ambiguous_lower, prob_thresh)` are colored yellow. Default `0.5`. Set to `prob_thresh` to disable the band.} \item{signal_only}{Logical. If `TRUE` (default), drop CS tuples where no trait is active and drop coloc rows whose dominant hypothesis is H0. Pass `FALSE` to keep everything.} \item{color}{One of `"auto"` (default; honors [crayon::has_color()]), `TRUE` (force colors on), or `FALSE` (force them off).} \item{...}{Ignored.} } \value{ A list of class `"summary.susie_post_outcome_configuration"` with components: \describe{ \item{`$susiex`}{`data.frame` (or `NULL` when no signals): one row per CS tuple. Columns: `tuple` (e.g. 
`"(1,1,1)"`), one numeric column per trait carrying that trait's `marginal_prob`, `top_pattern` (binary configuration string for the most-probable configuration), `top_prob` (its probability).} \item{`$coloc_pairwise`}{`data.frame` (or `NULL`): the original coloc table extended with `verdict` (named hypothesis label) and `top_pp` (the dominant PP value).} \item{`$susiex_n_total`, `$susiex_n_kept`, `$coloc_n_total`, `$coloc_n_kept`}{row counts before and after `signal_only` filtering, used by the print method to footer hidden rows.} \item{`$prob_thresh`, `$ambiguous_lower`, `$signal_only`, `$color`}{ parameters echoed for the print method.} } } \description{ Builds tidy tables from the nested list returned by [susie_post_outcome_configuration()] and prints them with ANSI color highlighting via [print.summary.susie_post_outcome_configuration()]. The summary itself is an S3 object: index `$susiex` and `$coloc_pairwise` to grab the data.frames for downstream use. } \details{ Color encoding (when ANSI colors are available): \itemize{ \item SuSiEx per-trait marginal probability: bold dark green when `>= prob_thresh` (active), yellow when in `[ambiguous_lower, prob_thresh)`, dim otherwise. The `active` logical from the raw result is encoded by color and is not shown as a separate column. \item Coloc verdict: bold dark green for H4 (shared causal), magenta for H3 (distinct causals), blue for H1 or H2 (single-trait causal), dim for H0 (no signal). The dominant PP per row is bolded. } Robustness: this method is defensive against malformed input. Empty lists, NULL components, missing fields, length-mismatched per-trait vectors, trait names that collide with reserved columns (`tuple`, `top_pattern`, `top_prob`), and coloc data.frames that lack some optional columns (`hit1`, `hit2`) all degrade gracefully rather than erroring. 
} \seealso{ [susie_post_outcome_configuration()], [print.summary.susie_post_outcome_configuration()] } ================================================ FILE: man/susie.Rd ================================================ % Generated by roxygen2: do not edit by hand % Please edit documentation in R/susie.R \name{susie} \alias{susie} \title{Sum of Single Effects (SuSiE) Regression} \usage{ susie( X, y, L = min(10, ncol(X)), scaled_prior_variance = 0.2, residual_variance = NULL, prior_weights = NULL, null_weight = 0, standardize = TRUE, intercept = TRUE, estimate_residual_variance = TRUE, estimate_residual_method = c("MoM", "MLE", "NIG"), estimate_prior_variance = TRUE, estimate_prior_method = c("optim", "EM", "simple"), prior_variance_grid = NULL, mixture_weights = NULL, unmappable_effects = c("none", "inf", "ash", "ash_filter_archived"), check_null_threshold = 0, prior_tol = 1e-09, residual_variance_upperbound = Inf, model_init = NULL, s_init = NULL, coverage = 0.95, min_abs_corr = 0.5, compute_univariate_zscore = FALSE, na.rm = FALSE, max_iter = 100, L_greedy = NULL, greedy_lbf_cutoff = 0.1, tol = 1e-04, convergence_method = c("elbo", "pip"), verbose = FALSE, track_fit = FALSE, residual_variance_lowerbound = NULL, refine = FALSE, n_purity = 100, alpha0 = 1/sqrt(nrow(X)), beta0 = 1/sqrt(nrow(X)), init_only = FALSE, slot_prior = NULL ) } \arguments{ \item{X}{An n by p matrix of covariates.} \item{y}{The observed responses, a vector of length n.} \item{L}{Maximum number of non-zero effects in the model. If L is larger than the number of covariates, p, L is set to p.} \item{scaled_prior_variance}{The prior variance, divided by \code{var(y)} (or by \code{(1/(n-1))yty} for \code{susie_ss}); that is, the prior variance of each non-zero element of b is \code{var(y) * scaled_prior_variance}. The value provided should be either a scalar or a vector of length \code{L}. 
If \code{estimate_prior_variance = TRUE}, this provides initial estimates of the prior variances.} \item{residual_variance}{Variance of the residual. If \code{estimate_residual_variance = TRUE}, this value provides the initial estimate of the residual variance. By default, it is set to \code{var(y)} in \code{susie} and \code{(1/(n-1))yty} in \code{susie_ss}.} \item{prior_weights}{A vector of length p, in which each entry gives the prior probability that the corresponding column of X has a nonzero effect on the outcome, y. The weights are internally normalized to sum to 1. When \code{NULL} (the default), uniform prior weights are used (each variable is assigned probability \code{1/p}).} \item{null_weight}{Prior probability of no effect (a number between 0 and 1, and cannot be exactly 1).} \item{standardize}{If \code{standardize = TRUE}, standardize the columns of X to unit variance prior to fitting (or equivalently standardize XtX and Xty to have the same effect). Note that \code{scaled_prior_variance} specifies the prior on the coefficients of X \emph{after} standardization (if it is performed). If you do not standardize, you may need to think more carefully about specifying \code{scaled_prior_variance}. Whatever your choice, the coefficients returned by \code{coef} are given for \code{X} on the original input scale. Any column of \code{X} that has zero variance is not standardized.} \item{intercept}{If \code{intercept = TRUE}, the intercept is fitted; if \code{intercept = FALSE}, the intercept is set to zero. Setting \code{intercept = FALSE} is generally not recommended.} \item{estimate_residual_variance}{If \code{estimate_residual_variance = TRUE}, the residual variance is estimated, using \code{residual_variance} as an initial value. If \code{estimate_residual_variance = FALSE}, the residual variance is fixed to the value supplied by \code{residual_variance}.} \item{estimate_residual_method}{The method used for estimating residual variance. 
For the original SuSiE model, "MLE" and "MoM" estimation is equivalent, but for the infinitesimal model, "MoM" is more stable. We recommend using "NIG" when n < 80 for improved coverage, although it is currently only implemented for individual-level data.} \item{estimate_prior_variance}{If \code{estimate_prior_variance = TRUE}, the prior variance is estimated (this is a separate parameter for each of the L effects). If provided, \code{scaled_prior_variance} is then used as an initial value for the optimization. When \code{estimate_prior_variance = FALSE}, the prior variance for each of the L effects is determined by the value supplied to \code{scaled_prior_variance}.} \item{estimate_prior_method}{The method used for estimating prior variance. When \code{estimate_prior_method = "simple"} is used, the likelihood at the specified prior variance is compared to the likelihood at a variance of zero, and the setting with the larger likelihood is retained. When \code{prior_variance_grid} is provided, this is automatically set to \code{"fixed_mixture"}.} \item{prior_variance_grid}{Numeric vector of K prior variances defining a mixture-of-normals prior on effect sizes. When provided, the SER evaluates Bayes factors at each grid point and forms a mixture BF weighted by \code{mixture_weights}. This bypasses the scalar prior variance optimization. Default is \code{NULL} (standard scalar V path).} \item{mixture_weights}{Numeric vector of K non-negative weights summing to 1, giving the mixture proportions for the variance grid. Default is \code{NULL}, which uses uniform weights when \code{prior_variance_grid} is provided.} \item{unmappable_effects}{The method for modeling unmappable effects: "none", "inf", "ash".} \item{check_null_threshold}{When the prior variance is estimated, compare the estimate with the null, and set the prior variance to zero unless the log-likelihood using the estimate is larger by this threshold amount. 
For example, if you set \code{check_null_threshold = 0.1}, this will "nudge" the estimate towards zero when the difference in log-likelihoods is small. A note of caution that setting this to a value greater than zero may lead the IBSS fitting procedure to occasionally decrease the ELBO. This setting is disabled when using \code{unmappable_effects = "inf"} or \code{unmappable_effects = "ash"}.} \item{prior_tol}{When the prior variance is estimated, compare the estimated value to \code{prior_tol} at the end of the computation, and exclude a single effect from PIP computation if the estimated prior variance is smaller than this tolerance value.} \item{residual_variance_upperbound}{Upper limit on the estimated residual variance. It is only relevant when \code{estimate_residual_variance = TRUE}.} \item{model_init}{A previous susie fit with which to initialize.} \item{s_init}{Deprecated alias for \code{model_init}.} \item{coverage}{A number between 0 and 1 specifying the \dQuote{coverage} of the estimated confidence sets.} \item{min_abs_corr}{Minimum absolute correlation allowed in a credible set. The default, 0.5, corresponds to a squared correlation of 0.25, which is a commonly used threshold for genotype data in genetic studies. This "purity" filter is applied to the CSs reported in the fit object, so the CS list returned here may be a subset of the one produced by calling \code{\link{susie_get_cs}} on the same fit without passing \code{X} or \code{Xcorr} (in which case the purity filter is skipped).} \item{compute_univariate_zscore}{If \code{compute_univariate_zscore = TRUE}, the univariate regression z-scores are outputted for each variable.} \item{na.rm}{Drop any missing values in y from both X and y.} \item{max_iter}{Maximum number of IBSS iterations to perform.} \item{L_greedy}{Integer or \code{NULL}. When non-\code{NULL}, run a greedy outer loop that grows the number of effects from \code{L_greedy} up to \code{L} in linear steps until the fit saturates. 
The default \code{NULL} runs the usual fixed-\code{L} fit.} \item{greedy_lbf_cutoff}{Numeric saturation threshold for the \code{L_greedy} outer loop. Default is 0.1.} \item{tol}{A small, non-negative number specifying the convergence tolerance for the IBSS fitting procedure.} \item{convergence_method}{When \code{convergence_method = "elbo"} the fitting procedure halts when the difference in the variational lower bound, or \dQuote{ELBO} (the objective function to be maximized), is less than \code{tol}. When \code{convergence_method = "pip"} the fitting procedure halts when the maximum absolute difference in \code{alpha} is less than \code{tol}.} \item{verbose}{If \code{verbose = TRUE}, the algorithm's progress, a summary of the optimization settings, and refinement progress (if \code{refine = TRUE}) are printed to the console.} \item{track_fit}{If \code{track_fit = TRUE}, \code{trace} is also returned containing detailed information about the estimates at each iteration of the IBSS fitting procedure.} \item{residual_variance_lowerbound}{Lower limit on the estimated residual variance. It is only relevant when \code{estimate_residual_variance = TRUE}.} \item{refine}{If \code{refine = TRUE}, then an additional iterative refinement procedure is used, after the IBSS algorithm, to check and escape from local optima (see details).} \item{n_purity}{Passed as argument \code{n_purity} to \code{\link{susie_get_cs}}.} \item{alpha0}{Numerical parameter for the NIG prior when using \code{estimate_residual_method = "NIG"}. Defaults to \code{1/sqrt(n)}, where \code{n} is the sample size. When calling \code{susie_rss} with NIG, \code{n} must be supplied; otherwise validation errors.} \item{beta0}{Numerical parameter for the NIG prior when using \code{estimate_residual_method = "NIG"}. Defaults to \code{1/sqrt(n)}, where \code{n} is the sample size. When calling \code{susie_rss} with NIG, \code{n} must be supplied; otherwise validation errors.} \item{init_only}{Logical. 
If \code{TRUE}, return a list with \code{data} and \code{params} objects without running the IBSS algorithm. Used by packages like susieAnn that implement their own outer loop around SuSiE's building blocks. Default is \code{FALSE}.} \item{slot_prior}{Optional slot activity prior created by \code{\link{slot_prior_betabinom}} or \code{\link{slot_prior_poisson}}. Use \code{slot_prior_betabinom(a_beta, b_beta)} for the usual single-locus setting; it places a Beta-Binomial prior on the number of active effects and gives an adaptive multiplicity correction. Use \code{slot_prior_poisson(C, nu)} when you want a Gamma-Poisson prior centered on an expected number \code{C} of active effects. When supplied, each single-effect slot has an estimated activity probability \code{c_hat}; fitted values and PIPs are weighted by these activity probabilities, and convergence is checked using \code{convergence_method = "pip"}.} } \value{ A \code{"susie"} object with some or all of the following elements: \item{alpha}{An L by p matrix of posterior inclusion probabilities.} \item{mu}{An L by p matrix of posterior means, conditional on inclusion.} \item{mu2}{An L by p matrix of posterior second moments, conditional on inclusion.} \item{Xr}{A vector of length n, equal to \code{X \%*\% colSums(alpha * mu)}.} \item{lbf}{Log-Bayes Factor for each single effect.} \item{lbf_variable}{Log-Bayes Factor for each variable and single effect.} \item{intercept}{Intercept (fixed or estimated).} \item{sigma2}{Residual variance (fixed or estimated).} \item{V}{Prior variance of the non-zero elements of b.} \item{elbo}{The variational lower bound (or ELBO) achieved at each iteration.} \item{fitted}{Vector of length n containing the fitted values.} \item{sets}{Credible sets estimated from model fit.} \item{pip}{A vector of length p giving the marginal posterior inclusion probabilities.} \item{z}{A vector of univariate z-scores.} \item{niter}{Number of IBSS iterations performed.} \item{converged}{\code{TRUE} 
or \code{FALSE} indicating whether the IBSS converged to a solution within the chosen tolerance level.} \item{theta}{If \code{unmappable_effects = "inf"} or \code{unmappable_effects = "ash"}, then \code{theta} is a p-vector of posterior means for the unmappable effects.} \item{tau2}{If \code{unmappable_effects = "inf"} or \code{unmappable_effects = "ash"}, then \code{tau2} is the unmappable variance.} } \description{ Performs a sparse Bayesian multiple linear regression of y on X, using the "Sum of Single Effects" model from Wang et al (2020). In brief, this function fits the regression model \eqn{y = \mu + X b + e}, where elements of \eqn{e} are \emph{i.i.d.} normal with zero mean and variance \code{residual_variance}, \eqn{\mu} is an intercept term and \eqn{b} is a vector of length p representing the effects to be estimated. The \dQuote{susie assumption} is that \eqn{b = \sum_{l=1}^L b_l} where each \eqn{b_l} is a vector of length p with exactly one non-zero element. The prior on the non-zero element is normal with zero mean and variance \code{var(y) * scaled_prior_variance}. The value of \code{L} is fixed, and should be chosen to provide a reasonable upper bound on the number of non-zero effects to be detected. Typically, the hyperparameters \code{residual_variance} and \code{scaled_prior_variance} will be estimated during model fitting, although they can also be fixed as specified by the user. See functions \code{\link{susie_get_cs}} and other functions of form \code{susie_get_*} to extract the most commonly-used results from a susie fit. The function \code{susie} implements the IBSS algorithm from Wang et al (2020). The option \code{refine = TRUE} implements an additional step to help reduce problems caused by convergence of the IBSS algorithm to poor local optima (which is rare in our experience, but can provide misleading results when it occurs). 
The refinement step incurs additional computational expense that increases with the number of CSs found in the initial run. The function \code{susie_ss} implements essentially the same algorithms, but using sufficient statistics. (The statistics are sufficient for the regression coefficients \eqn{b}, but not for the intercept \eqn{\mu}; see below for how the intercept is treated.) If the sufficient statistics are computed correctly then the results from \code{susie_ss} should be the same as (or very similar to) \code{susie}, although runtimes will differ as discussed below. The sufficient statistics are the sample size \code{n}, and then the p by p matrix \eqn{X'X}, the p-vector \eqn{X'y}, and the sum of squared y values \eqn{y'y}, all computed after centering the columns of \eqn{X} and the vector \eqn{y} to have mean 0; these can be computed using \code{compute_suff_stat}. The handling of the intercept term in \code{susie_ss} needs some additional explanation. Computing the summary data after centering \code{X} and \code{y} effectively ensures that the resulting posterior quantities for \eqn{b} allow for an intercept in the model; however, the actual value of the intercept cannot be estimated from these centered data. To estimate the intercept term the user must also provide the column means of \eqn{X} and the mean of \eqn{y} (\code{X_colmeans} and \code{y_mean}). If these are not provided, they are treated as \code{NA}, which results in the intercept being \code{NA}. If for some reason you prefer to have the intercept be 0 instead of \code{NA} then set \code{X_colmeans = 0,y_mean = 0}. 
For completeness, we note that if \code{susie_ss} is run on \eqn{X'X, X'y, y'y} computed \emph{without} centering \eqn{X} and \eqn{y}, and with \code{X_colmeans = 0,y_mean = 0}, this is equivalent to \code{susie} applied to \eqn{X, y} with \code{intercept = FALSE} (although results may differ due to different initializations of \code{residual_variance} and \code{scaled_prior_variance}). However, this usage is not recommended for most situations. The computational complexity of \code{susie} is \eqn{O(npL)} per iteration, whereas \code{susie_ss} is \eqn{O(p^2L)} per iteration (not including the cost of computing the sufficient statistics, which is dominated by the \eqn{O(np^2)} cost of computing \eqn{X'X}). Because of the cost of computing \eqn{X'X}, \code{susie} will usually be faster. However, if \eqn{n >> p}, and/or if \eqn{X'X} is already computed, then \code{susie_ss} may be faster. } ================================================ FILE: man/susieR-package.Rd ================================================ % Generated by roxygen2: do not edit by hand % Please edit documentation in R/susieR-package.R \docType{package} \name{susieR-package} \alias{susieR} \alias{susieR-package} \title{susieR: Sum of Single Effects Linear Regression} \description{ Implements methods for variable selection in linear regression based on the "Sum of Single Effects" (SuSiE) model, as described in Wang et al (2020) \doi{10.1101/501114} and Zou et al (2021) \doi{10.1101/2021.11.03.467167}. These methods provide simple summaries, called "Credible Sets", for accurately quantifying uncertainty in which variables should be selected. The methods are motivated by genetic fine-mapping applications, and are particularly well-suited to settings where variables are highly correlated and detectable effects are sparse. 
The fitting algorithm, a Bayesian analogue of stepwise selection methods called "Iterative Bayesian Stepwise Selection" (IBSS), is simple and fast, allowing the SuSiE model to be fit to large data sets (thousands of samples and hundreds of thousands of variables). } \seealso{ Useful links: \itemize{ \item \url{https://github.com/stephenslab/susieR} \item Report bugs at \url{https://github.com/stephenslab/susieR/issues} } } \author{ \strong{Maintainer}: Peter Carbonetto \email{peter.carbonetto@gmail.com} Authors: \itemize{ \item Gao Wang \email{wang.gao@columbia.edu} \item Yuxin Zou \item Alexander McCreight \item Kaiqian Zhang \item William R.P. Denault \item Matthew Stephens } } \keyword{internal} ================================================ FILE: man/susie_auto.Rd ================================================ % Generated by roxygen2: do not edit by hand % Please edit documentation in R/susie_auto.R \name{susie_auto} \alias{susie_auto} \title{Attempt at Automating SuSiE for Hard Problems} \usage{ susie_auto( X, y, L_init = 1, L_max = 512, verbose = FALSE, init_tol = 1, standardize = TRUE, intercept = TRUE, max_iter = 100, tol = 0.01, ... ) } \arguments{ \item{X}{An n by p matrix of covariates.} \item{y}{The observed responses, a vector of length n.} \item{L_init}{The initial value of L.} \item{L_max}{The largest value of L to consider.} \item{verbose}{If \code{verbose = TRUE}, the algorithm's progress, and a summary of the optimization settings, are printed to the console.} \item{init_tol}{The tolerance passed to \code{susie} during early runs (set large to shorten the initial runs).} \item{standardize}{If \code{standardize = TRUE}, standardize the columns of X to unit variance prior to fitting. Note that \code{scaled_prior_variance} specifies the prior on the coefficients of X \emph{after} standardization (if it is performed). If you do not standardize, you may need to think more carefully about specifying \code{scaled_prior_variance}. 
Whatever your choice, the coefficients returned by \code{coef} are given for \code{X} on the original input scale. Any column of \code{X} that has zero variance is not standardized.} \item{intercept}{If \code{intercept = TRUE}, the intercept is fitted; if \code{intercept = FALSE}, the intercept is set to zero. Setting \code{intercept = FALSE} is generally not recommended.} \item{max_iter}{Maximum number of IBSS iterations to perform.} \item{tol}{A small, non-negative number specifying the convergence tolerance for the IBSS fitting procedure. The fitting procedure will halt when the difference in the variational lower bound, or \dQuote{ELBO} (the objective function to be maximized), is less than \code{tol}.} \item{\dots}{Additional arguments passed to \code{\link{susie}}.} } \value{ See \code{\link{susie}} for a description of return values. } \description{ \code{susie_auto} is an attempt to automate reliable running of susie even on hard problems. It implements a three-stage strategy for each L: first, fit susie with very small residual error; next, estimate residual error; finally, estimate the prior variance. If the last step estimates some prior variances to be zero, stop. Otherwise, double L, and repeat. Initial runs are performed with relaxed tolerance; the final run is performed using the default susie tolerance. 
} \examples{ set.seed(1) n = 1000 p = 1000 beta = rep(0,p) beta[1:4] = 1 X = matrix(rnorm(n*p),nrow = n,ncol = p) X = scale(X,center = TRUE,scale = TRUE) y = drop(X \%*\% beta + rnorm(n)) res = susie_auto(X,y) plot(beta,coef(res)[-1]) abline(a = 0,b = 1,col = "skyblue",lty = "dashed") plot(y,predict(res)) abline(a = 0,b = 1,col = "skyblue",lty = "dashed") } \seealso{ \code{\link{susie}} } ================================================ FILE: man/susie_get_methods.Rd ================================================ % Generated by roxygen2: do not edit by hand % Please edit documentation in R/susie_get_functions.R \name{susie_get_objective} \alias{susie_get_objective} \alias{susie_get_posterior_mean} \alias{susie_get_posterior_sd} \alias{susie_get_niter} \alias{susie_get_prior_variance} \alias{susie_get_residual_variance} \alias{susie_get_lfsr} \alias{susie_get_posterior_samples} \alias{susie_get_cs} \alias{susie_get_pip} \title{Inferences From Fitted SuSiE Model} \usage{ susie_get_objective(res, last_only = TRUE, warning_tol = 1e-06) susie_get_posterior_mean(res, prior_tol = 1e-09) susie_get_posterior_sd(res, prior_tol = 1e-09) susie_get_niter(res) susie_get_prior_variance(res) susie_get_residual_variance(res) susie_get_lfsr(res) susie_get_posterior_samples(susie_fit, num_samples) susie_get_cs( res, X = NULL, Xcorr = NULL, coverage = 0.95, min_abs_corr = 0.5, dedup = TRUE, squared = FALSE, check_symmetric = TRUE, n_purity = 100, use_rfast = NULL, ld_extend_threshold = 0.99 ) susie_get_pip(res, prune_by_cs = FALSE, prior_tol = 1e-09) } \arguments{ \item{res}{A susie fit, typically an output from \code{\link{susie}} or one of its variants. 
For \code{susie_get_pip} and \code{susie_get_cs}, this may instead be the posterior inclusion probability matrix, \code{alpha}.} \item{last_only}{If \code{last_only = FALSE}, return the ELBO from all iterations; otherwise return the ELBO from the last iteration only.} \item{warning_tol}{Warn if ELBO is decreasing by this tolerance level.} \item{prior_tol}{Filter out effects having estimated prior variance smaller than this threshold.} \item{susie_fit}{A susie fit, an output from \code{\link{susie}}.} \item{num_samples}{The number of draws from the posterior distribution.} \item{X}{n by p matrix of values of the p variables (covariates) in n samples. When provided, correlation between variables will be computed and used to remove CSs whose minimum correlation among variables is smaller than \code{min_abs_corr}.} \item{Xcorr}{p by p matrix of correlations between variables (covariates). When provided, it will be used to remove CSs whose minimum correlation among variables is smaller than \code{min_abs_corr}.} \item{coverage}{A number between 0 and 1 specifying desired coverage of each CS.} \item{min_abs_corr}{A "purity" threshold for the CS. Any CS that contains a pair of variables with correlation less than this threshold will be filtered out and not reported. This filter is only applied when \code{X} or \code{Xcorr} is provided; otherwise it is ignored and a warning is issued.} \item{dedup}{If \code{dedup = TRUE}, remove duplicate CSs.} \item{squared}{If \code{squared = TRUE}, report min, mean and median of squared correlation instead of the absolute correlation.} \item{check_symmetric}{If \code{check_symmetric = TRUE}, perform a check for symmetry of matrix \code{Xcorr} when \code{Xcorr} is provided (not \code{NULL}).} \item{n_purity}{The maximum number of credible set (CS) variables used in calculating the correlation (\dQuote{purity}) statistics. 
When the number of variables included in the CS is greater than this number, the CS variables are randomly subsampled.} \item{use_rfast}{Use the Rfast package for the purity calculations. By default \code{use_rfast = TRUE} if the Rfast package is installed.} \item{ld_extend_threshold}{Threshold for extending CS by LD (default 0.99). Variants with |correlation| > threshold with any CS member are added. Set to NULL to disable LD extension. Requires Xcorr (would not work if only X is provided).} \item{prune_by_cs}{Whether or not to ignore single effects not in a reported CS when calculating PIP.} } \value{ \code{susie_get_objective} returns the evidence lower bound (ELBO) achieved by the fitted susie model and, optionally, at each iteration of the IBSS fitting procedure. \code{susie_get_residual_variance} returns the (estimated or fixed) residual variance parameter. \code{susie_get_prior_variance} returns the (estimated or fixed) prior variance parameters. \code{susie_get_posterior_mean} returns the posterior mean for the regression coefficients of the fitted susie model. \code{susie_get_posterior_sd} returns the posterior standard deviation for coefficients of the fitted susie model. \code{susie_get_niter} returns the number of model fitting iterations performed. \code{susie_get_pip} returns a vector containing the posterior inclusion probabilities (PIPs) for all variables. \code{susie_get_lfsr} returns a vector containing the average lfsr across variables for each single-effect, weighted by the posterior inclusion probability (alpha). \code{susie_get_posterior_samples} returns a list containing the effect sizes samples and causal status with two components: \code{b}, an \code{num_variables} x \code{num_samples} matrix of effect sizes; \code{gamma}, an \code{num_variables} x \code{num_samples} matrix of causal status random draws. 
\code{susie_get_cs} returns credible sets (CSs) from a susie fit, as well as summaries of correlation among the variables included in each CS. If desired, one can filter out CSs that do not meet a specified \dQuote{purity} threshold; to do this, either \code{X} or \code{Xcorr} must be supplied. It returns a list with the following elements: \item{cs}{A list in which each list element is a vector containing the indices of the variables in the CS.} \item{coverage}{The nominal coverage specified for each CS.} \item{purity}{If \code{X} or \code{Xcorr} is provided, the purity of each CS.} \item{cs_index}{If \code{X} or \code{Xcorr} is provided, the index (number between 1 and L) of each reported CS in the supplied susie fit.} } \description{ These functions access basic properties or draw inferences from a fitted susie model. } \examples{ set.seed(1) n <- 1000 p <- 1000 beta <- rep(0, p) beta[1:4] <- 1 X <- matrix(rnorm(n * p), nrow = n, ncol = p) X <- scale(X, center = TRUE, scale = TRUE) y <- drop(X \%*\% beta + rnorm(n)) s <- susie(X, y, L = 10) susie_get_objective(s) susie_get_objective(s, last_only = FALSE) susie_get_residual_variance(s) susie_get_prior_variance(s) susie_get_posterior_mean(s) susie_get_posterior_sd(s) susie_get_niter(s) susie_get_pip(s) susie_get_lfsr(s) } ================================================ FILE: man/susie_init_coef.Rd ================================================ % Generated by roxygen2: do not edit by hand % Please edit documentation in R/susie_get_functions.R \name{susie_init_coef} \alias{susie_init_coef} \title{Initialize a susie object using regression coefficients} \usage{ susie_init_coef(coef_index, coef_value, p) } \arguments{ \item{coef_index}{An L-vector containing the indices of the nonzero coefficients.} \item{coef_value}{An L-vector containing initial coefficient estimates.} \item{p}{A scalar giving the number of variables.} } \value{ A list with elements \code{alpha}, \code{mu} and \code{mu2} to be used by 
\code{susie}. } \description{ Initialize a susie object using regression coefficients } \examples{ set.seed(1) n = 1000 p = 1000 beta = rep(0,p) beta[sample(1:1000,4)] = 1 X = matrix(rnorm(n*p),nrow = n,ncol = p) X = scale(X,center = TRUE,scale = TRUE) y = drop(X \%*\% beta + rnorm(n)) # Initialize susie to ground-truth coefficients. s = susie_init_coef(which(beta != 0),beta[beta != 0],length(beta)) res = susie(X,y,L = 10,model_init=s) } ================================================ FILE: man/susie_plot_changepoint.Rd ================================================ % Generated by roxygen2: do not edit by hand % Please edit documentation in R/susie_plot.R \name{susie_plot_changepoint} \alias{susie_plot_changepoint} \title{Plot changepoint data and susie fit using ggplot2} \usage{ susie_plot_changepoint( s, y, line_col = "blue", line_size = 1.5, cs_col = "red" ) } \arguments{ \item{s}{A susie fit generated by \code{susie_trendfilter(y,order = 0)}.} \item{y}{An n-vector of observations that are ordered in time or space (assumed equally-spaced).} \item{line_col}{Color for the line showing fitted values.} \item{line_size}{Size of the lines showing fitted values} \item{cs_col}{Color of the shaded rectangles showing credible sets.} } \value{ A ggplot2 plot object. } \description{ Plots original data, y, overlaid with line showing susie fitted value and shaded rectangles showing credible sets for changepoint locations. } \examples{ set.seed(1) mu <- c(rep(0, 50), rep(1, 50), rep(3, 50), rep(-2, 50), rep(0, 300)) y <- mu + rnorm(500) # Here we use a less sensitive tolerance so that the example takes # less time; in practice you will likely want to use a more stringent # setting such as tol = 0.001. s <- susie_trendfilter(y, tol = 0.1) # Produces ggplot with credible sets for changepoints. 
susie_plot_changepoint(s, y) } ================================================ FILE: man/susie_plots.Rd ================================================ % Generated by roxygen2: do not edit by hand % Please edit documentation in R/susie_plot.R \name{susie_plot} \alias{susie_plot} \alias{susie_plot_iteration} \title{SuSiE Plots.} \usage{ susie_plot( model, y, add_bar = FALSE, pos = NULL, b = NULL, max_cs = 400, add_legend = NULL, ... ) susie_plot_iteration(model, L, file_prefix, pos = NULL) } \arguments{ \item{model}{A SuSiE fit, typically an output from \code{\link{susie}} or one of its variants. For \code{susie_plot}, the susie fit must have \code{model$z}, \code{model$PIP}, and may include \code{model$sets}. \code{model} may also be a vector of z-scores or PIPs.} \item{y}{A string indicating what to plot: either \code{"z_original"} for z-scores, \code{"z"} for z-score derived p-values on (base-10) log-scale, \code{"PIP"} for posterior inclusion probabilities, \code{"log10PIP"} for posterior inclusion probabilities on the (base-10) log-scale. For any other setting, the data are plotted as is.} \item{add_bar}{If \code{add_bar = TRUE}, add horizontal bar to signals in credible interval.} \item{pos}{Indices of variables to plot. If \code{pos = NULL} all variables are plotted.} \item{b}{For simulated data, set \code{b = TRUE} to highlight "true" effects (highlights in red).} \item{max_cs}{The largest credible set to display, either based on purity (set \code{max_cs} between 0 and 1), or based on size (set \code{max_cs > 1}).} \item{add_legend}{If \code{add_legend = TRUE}, add a legend to annotate the size and purity of each CS discovered. 
It can also be specified as location where legends should be added, e.g., \code{add_legend = "bottomright"} (default location is \code{"topright"}).} \item{\dots}{Additional arguments passed to \code{\link[graphics]{plot}}.} \item{L}{An integer specifying the number of credible sets to plot.} \item{file_prefix}{Prefix to path of output plot file. If not specified, the plot, or plots, will be saved to a temporary directory generated using \code{\link{tempdir}}.} } \value{ Invisibly returns \code{NULL}. } \description{ \code{susie_plot} produces a per-variable summary of the SuSiE credible sets. \code{susie_plot_iteration} produces a diagnostic plot for the susie model fitting. For \code{susie_plot_iteration}, several plots will be created if \code{track_fit = TRUE} when calling \code{susie}. } \examples{ set.seed(1) n <- 1000 p <- 1000 beta <- rep(0, p) beta[sample(1:1000, 4)] <- 1 X <- matrix(rnorm(n * p), nrow = n, ncol = p) X <- scale(X, center = TRUE, scale = TRUE) y <- drop(X \%*\% beta + rnorm(n)) res <- susie(X, y, L = 10) susie_plot(res, "PIP") susie_plot(res, "PIP", add_bar = TRUE) susie_plot(res, "PIP", add_legend = TRUE) susie_plot(res, "PIP", pos = 1:500, add_legend = TRUE) # Plot selected regions with adjusted x-axis position label res$genomic_position <- 1000 + (1:length(res$pip)) susie_plot(res, "PIP", add_legend = TRUE, pos = list(attr = "genomic_position", start = 1000, end = 1500) ) # True effects are shown in red. 
susie_plot(res, "PIP", b = beta, add_legend = TRUE) set.seed(1) n <- 1000 p <- 1000 beta <- rep(0, p) beta[sample(1:1000, 4)] <- 1 X <- matrix(rnorm(n * p), nrow = n, ncol = p) X <- scale(X, center = TRUE, scale = TRUE) y <- drop(X \%*\% beta + rnorm(n)) res <- susie(X, y, L = 10) susie_plot_iteration(res, L = 10) } \seealso{ \code{\link{susie_plot_changepoint}} } ================================================ FILE: man/susie_post_outcome_configuration.Rd ================================================ % Generated by roxygen2: do not edit by hand % Please edit documentation in R/susie_post_outcome_configuration.R \name{susie_post_outcome_configuration} \alias{susie_post_outcome_configuration} \title{Post-hoc causal-configuration probabilities for one or more SuSiE-class fits} \usage{ susie_post_outcome_configuration( input, by = c("fit", "outcome"), method = c("susiex", "coloc_pairwise"), prob_thresh = 0.8, cs_only = TRUE, p1 = 1e-04, p2 = 1e-04, p12 = 5e-06, ... ) } \arguments{ \item{input}{A single fit of class \code{susie}, \code{mvsusie}, or \code{mfsusie}, OR a list of such fits.} \item{by}{Either \code{"fit"} (one trait per input fit; default) or \code{"outcome"} (multi-output fits expand into per-outcome traits).} \item{method}{Character scalar; one of \code{"susiex"} (default) or \code{"coloc_pairwise"}. Pick the analysis to run; for both, call the function twice.} \item{prob_thresh}{Per-trait marginal threshold for the convenience \code{$active} flags in the SuSiEx output. Default \code{0.8}.} \item{cs_only}{Logical. If \code{TRUE} (default) only enumerate over CSs present in each fit's \code{$sets$cs}; if \code{FALSE} loop over all L rows of \code{$alpha}. Either way, effects whose entire alpha row is zero are skipped. When \code{TRUE}, every fit must carry a non-null \code{$sets$cs} or the function errors.} \item{p1, p2, p12}{Coloc per-SNP causal priors: \code{p1} for trait 1 alone, \code{p2} for trait 2 alone, \code{p12} for shared causal. 
Defaults match \code{coloc::coloc.bf_bf}: \code{p1 = p2 = 1e-4}, \code{p12 = 5e-6}. Only used when \code{method = "coloc_pairwise"}.} \item{...}{Currently ignored.} } \value{ A list of class \code{"susie_post_outcome_configuration"} with exactly one of the following components, depending on \code{method}: \describe{ \item{\code{$susiex}}{(when \code{method = "susiex"}) A list of length equal to the number of CS tuples considered. Each element has components \code{cs_indices} (length-N integer tuple), \code{logBF_trait} (length N), \code{configs} (\eqn{2^N \times N} binary matrix), \code{config_prob} (length \eqn{2^N}), \code{marginal_prob} (length-N per-trait marginal posterior probability of being active across the configuration ensemble), and \code{active} (logical, \code{marginal_prob >= prob_thresh}).} \item{\code{$coloc_pairwise}}{(when \code{method = "coloc_pairwise"}) A data.frame with one row per (trait1, trait2, l1, l2) combination, columns \code{trait1, trait2, l1, l2, hit1, hit2, PP.H0, PP.H1, PP.H2, PP.H3, PP.H4}.} } Pretty-print with \code{summary(out)}. } \description{ Runs one of two complementary post-hoc analyses, selected by \code{method}: \code{"susiex"} (default) for the SuSiEx \eqn{2^N} combinatorial enumeration, reporting the posterior probability of every binary causality pattern across the \eqn{N} input traits; or \code{"coloc_pairwise"} for the coloc pairwise ABF, reporting the five colocalisation hypothesis posteriors (H0/H1/H2/H3/H4) for every pair of traits. To get both, call the function twice and combine. } \details{ Two grouping modes are supported through the \code{by} argument: \describe{ \item{\code{"fit"}}{Each input fit contributes a single trait view. Multi-output fits (\code{mvsusie}, \code{mfsusie}) are kept whole: the trait's per-(CS, SNP) log Bayes factors are the joint composite stored on the fit as \code{lbf_variable}. 
Configuration enumeration loops over the cross-product \eqn{L_1 \times \dots \times L_N} of CS indices.} \item{\code{"outcome"}}{Multi-output fits fan out into per-outcome views, each with its own per-(CS, SNP) log Bayes factors read from \code{fit$lbf_variable_outcome} (an \eqn{L \times J \times R} or \eqn{L \times J \times M} array). All per-outcome views share the joint fit's PIP matrix and CS list, so the configuration enumeration reduces to a single index \eqn{l \in 1..L}. Single-output \code{susie} fits pass through unchanged. Requires \code{$lbf_variable_outcome} on the fit (set \code{attach_lbf_variable_outcome = TRUE} when fitting).} } \subsection{SuSiEx algorithm}{ For each credible-set tuple \eqn{(l_1, \dots, l_N)}: \enumerate{ \item Per-trait CS-level log BF (alpha-weighted SNP average): \deqn{\log\mathrm{BF}^{(n)}_{l_n} = \sum_j \alpha_{n,l_n,j}\, \log\mathrm{BF}_{n,l_n,j}.} \item Enumerate the \eqn{2^N} binary configurations \eqn{c \in \{0,1\}^N}. \item Configuration log BF: \deqn{\log\mathrm{BF}^{(c)} = \sum_{n: c_n = 1} \log\mathrm{BF}^{(n)}_{l_n}.} \item Normalise under a uniform prior over the \eqn{2^N} configurations. \item Per-trait marginal: \eqn{P(\mathrm{trait}\,n\,\mathrm{causal}) = \sum_{c: c_n = 1} P(c \mid \mathrm{tuple})}. 
} } \subsection{Coloc pairwise algorithm}{ For each unordered trait pair \eqn{(n, n')} and each CS pair \eqn{(l_n, l_{n'})}, with per-SNP log BFs \eqn{\ell_1 = \log\mathrm{BF}_{n,l_n,\cdot}} and \eqn{\ell_2 = \log\mathrm{BF}_{n',l_{n'},\cdot}} (length \eqn{J}), the five hypothesis log-BFs are \deqn{\log\mathrm{BF}_{H_0} = 0,\quad \log\mathrm{BF}_{H_1} = \log p_1 + \mathrm{LSE}(\ell_1),\quad \log\mathrm{BF}_{H_2} = \log p_2 + \mathrm{LSE}(\ell_2),} \deqn{\log\mathrm{BF}_{H_3} = \log p_1 + \log p_2 + \mathrm{logdiff}(\mathrm{LSE}(\ell_1) + \mathrm{LSE}(\ell_2),\; \mathrm{LSE}(\ell_1 + \ell_2)),} \deqn{\log\mathrm{BF}_{H_4} = \log p_{12} + \mathrm{LSE}(\ell_1 + \ell_2),} and the corresponding posteriors are \eqn{\mathrm{PP.H}_h = \exp(\log\mathrm{BF}_{H_h} - \mathrm{LSE}(\log\mathrm{BF}_{H_0:H_4}))}, where \eqn{\mathrm{LSE}} is the log-sum-exp. \itemize{ \item H0: no causal variant in either CS. \item H1: causal in trait \eqn{n} only. \item H2: causal in trait \eqn{n'} only. \item H3: distinct causals in the two traits. \item H4: a single shared causal variant. } } } \references{ SuSiEx, Nature Genetics 2024 (combinatorial \eqn{2^N} enumeration). Wallace, PLoS Genetics 2020 (coloc pairwise H0/H1/H2/H3/H4 ABF). 
} ================================================ FILE: man/susie_rss.Rd ================================================ % Generated by roxygen2: do not edit by hand % Please edit documentation in R/susie.R \name{susie_rss} \alias{susie_rss} \title{SuSiE with Regression Summary Statistics (RSS)} \usage{ susie_rss( z = NULL, R = NULL, n = NULL, X = NULL, bhat = NULL, shat = NULL, var_y = NULL, L = min(10, if (is.list(R) && !is.matrix(R)) ncol(R[[1]]) else if (!is.null(R)) ncol(R) else if (is.list(X) && !is.matrix(X)) ncol(X[[1]]) else ncol(X)), maf = NULL, maf_thresh = 0, scaled_prior_variance = 0.2, residual_variance = NULL, prior_weights = NULL, null_weight = 0, standardize = TRUE, estimate_residual_variance = FALSE, estimate_residual_method = c("MoM", "MLE", "NIG"), estimate_prior_variance = TRUE, estimate_prior_method = c("optim", "EM", "simple"), prior_variance_grid = NULL, mixture_weights = NULL, unmappable_effects = c("none", "inf", "ash", "ash_filter_archived"), check_null_threshold = 0, prior_tol = 1e-09, residual_variance_lowerbound = 0, residual_variance_upperbound = Inf, model_init = NULL, s_init = NULL, coverage = 0.95, min_abs_corr = 0.5, max_iter = 100, L_greedy = NULL, greedy_lbf_cutoff = 0.1, tol = 1e-04, convergence_method = c("elbo", "pip"), verbose = FALSE, track_fit = FALSE, check_input = FALSE, check_prior = TRUE, n_purity = 100, r_tol = 1e-08, refine = FALSE, R_finite = NULL, R_mismatch = c("none", "map", "map_qc"), eig_delta_rel = 0.001, eig_delta_abs = 0, artifact_threshold = 0.1, alpha0 = if (is.null(n)) NULL else 1/sqrt(n), beta0 = if (is.null(n)) NULL else 1/sqrt(n), init_only = FALSE, slot_prior = NULL ) } \arguments{ \item{z}{A p-vector of z-scores.} \item{R}{A p by p correlation matrix. Exactly one of \code{R} or \code{X} must be provided.} \item{n}{The sample size, not required but recommended.} \item{X}{A factor matrix (B x p) such that \code{R = crossprod(X) / nrow(X)} approximates the R (correlation) matrix. 
When \code{nrow(X) >= ncol(X)}, the correlation matrix \code{R} is formed explicitly and the standard path is used. When \code{nrow(X) < ncol(X)}, a low-rank path is used that avoids forming the p x p matrix, reducing per-iteration cost from O(Lp^2) to O(LBp). Columns of \code{X} are standardized internally.} \item{bhat}{Alternative summary data giving the estimated effects (a vector of length p). This, together with \code{shat}, may be provided instead of \code{z}.} \item{shat}{Alternative summary data giving the standard errors of the estimated effects (a vector of length p). This, together with \code{bhat}, may be provided instead of \code{z}.} \item{var_y}{The sample variance of y, defined as \eqn{y'y/(n-1)}. When the sample variance is not provided, the coefficients (returned from \code{coef}) are computed on the \dQuote{standardized} X, y scale.} \item{L}{Maximum number of non-zero effects in the model. If L is larger than the number of covariates, p, L is set to p.} \item{maf}{A p-vector of minor allele frequencies; to be used along with \code{maf_thresh} to filter input summary statistics.} \item{maf_thresh}{Variants with MAF smaller than this threshold are not used.} \item{scaled_prior_variance}{The prior variance, divided by \code{var(y)} (or by \code{(1/(n-1))yty} for \code{susie_ss}); that is, the prior variance of each non-zero element of b is \code{var(y) * scaled_prior_variance}. The value provided should be either a scalar or a vector of length \code{L}. If \code{estimate_prior_variance = TRUE}, this provides initial estimates of the prior variances.} \item{residual_variance}{Variance of the residual. If \code{estimate_residual_variance = TRUE}, this value provides the initial estimate of the residual variance. 
By default, it is set to \code{var(y)} in \code{susie} and \code{(1/(n-1))yty} in \code{susie_ss}.} \item{prior_weights}{A vector of length p, in which each entry gives the prior probability that corresponding column of X has a nonzero effect on the outcome, y. The weights are internally normalized to sum to 1. When \code{NULL} (the default), uniform prior weights are used (each variable is assigned probability \code{1/p}).} \item{null_weight}{Prior probability of no effect (a number between 0 and 1, and cannot be exactly 1).} \item{standardize}{If \code{standardize = TRUE}, standardize the columns of X to unit variance prior to fitting (or equivalently standardize XtX and Xty to have the same effect). Note that \code{scaled_prior_variance} specifies the prior on the coefficients of X \emph{after} standardization (if it is performed). If you do not standardize, you may need to think more carefully about specifying \code{scaled_prior_variance}. Whatever your choice, the coefficients returned by \code{coef} are given for \code{X} on the original input scale. Any column of \code{X} that has zero variance is not standardized.} \item{estimate_residual_variance}{The default is FALSE, the residual variance is fixed to 1 or variance of y. If the in-sample R matrix is provided, we recommend setting \code{estimate_residual_variance = TRUE}.} \item{estimate_residual_method}{The method used for estimating residual variance. For the original SuSiE model, "MLE" and "MoM" estimation is equivalent, but for the infinitesimal model, "MoM" is more stable. We recommend using "NIG" when n < 80 for improved coverage, although it is currently only implemented for individual-level data.} \item{estimate_prior_variance}{If \code{estimate_prior_variance = TRUE}, the prior variance is estimated (this is a separate parameter for each of the L effects). If provided, \code{scaled_prior_variance} is then used as an initial value for the optimization. 
When \code{estimate_prior_variance = FALSE}, the prior variance for each of the L effects is determined by the value supplied to \code{scaled_prior_variance}.} \item{estimate_prior_method}{The method used for estimating prior variance. When \code{estimate_prior_method = "simple"} is used, the likelihood at the specified prior variance is compared to the likelihood at a variance of zero, and the setting with the larger likelihood is retained. When \code{prior_variance_grid} is provided, this is automatically set to \code{"fixed_mixture"}.} \item{prior_variance_grid}{Numeric vector of K prior variances defining a mixture-of-normals prior on effect sizes. When provided, the SER evaluates Bayes factors at each grid point and forms a mixture BF weighted by \code{mixture_weights}. This bypasses the scalar prior variance optimization. Default is \code{NULL} (standard scalar V path).} \item{mixture_weights}{Numeric vector of K non-negative weights summing to 1, giving the mixture proportions for the variance grid. Default is \code{NULL}, which uses uniform weights when \code{prior_variance_grid} is provided.} \item{unmappable_effects}{The method for modeling unmappable effects: "none", "inf", "ash", or "ash_filter_archived" (an archived variant retained for backward compatibility).} \item{check_null_threshold}{When the prior variance is estimated, compare the estimate with the null, and set the prior variance to zero unless the log-likelihood using the estimate is larger by this threshold amount. For example, if you set \code{check_null_threshold = 0.1}, this will "nudge" the estimate towards zero when the difference in log-likelihoods is small. A note of caution that setting this to a value greater than zero may lead the IBSS fitting procedure to occasionally decrease the ELBO. 
This setting is disabled when using \code{unmappable_effects = "inf"} or \code{unmappable_effects = "ash"}.} \item{prior_tol}{When the prior variance is estimated, compare the estimated value to \code{prior_tol} at the end of the computation, and exclude a single effect from PIP computation if the estimated prior variance is smaller than this tolerance value.} \item{residual_variance_lowerbound}{Lower limit on the estimated residual variance. It is only relevant when \code{estimate_residual_variance = TRUE}.} \item{residual_variance_upperbound}{Upper limit on the estimated residual variance. It is only relevant when \code{estimate_residual_variance = TRUE}.} \item{model_init}{A previous susie fit with which to initialize.} \item{s_init}{Deprecated alias for \code{model_init}.} \item{coverage}{A number between 0 and 1 specifying the \dQuote{coverage} of the estimated confidence sets.} \item{min_abs_corr}{Minimum absolute correlation allowed in a credible set. The default, 0.5, corresponds to a squared correlation of 0.25, which is a commonly used threshold for genotype data in genetic studies. This "purity" filter is applied to the CSs reported in the fit object, so the CS list returned here may be a subset of the one produced by calling \code{\link{susie_get_cs}} on the same fit without passing \code{X} or \code{Xcorr} (in which case the purity filter is skipped).} \item{max_iter}{Maximum number of IBSS iterations to perform.} \item{L_greedy}{Integer or \code{NULL}. When non-\code{NULL}, run a greedy outer loop that grows the number of effects from \code{L_greedy} up to \code{L} in linear steps until the fit saturates. The default \code{NULL} runs the usual fixed-\code{L} fit.} \item{greedy_lbf_cutoff}{Numeric saturation threshold for the \code{L_greedy} outer loop. 
Default is 0.1.} \item{tol}{A small, non-negative number specifying the convergence tolerance for the IBSS fitting procedure.} \item{convergence_method}{When \code{convergence_method = "elbo"} the fitting procedure halts when the difference in the variational lower bound, or \dQuote{ELBO} (the objective function to be maximized), is less than \code{tol}. When \code{convergence_method = "pip"} the fitting procedure halts when the maximum absolute difference in \code{alpha} is less than \code{tol}.} \item{verbose}{If \code{verbose = TRUE}, the algorithm's progress, a summary of the optimization settings, and refinement progress (if \code{refine = TRUE}) are printed to the console.} \item{track_fit}{If \code{track_fit = TRUE}, \code{trace} is also returned containing detailed information about the estimates at each iteration of the IBSS fitting procedure.} \item{check_input}{If \code{check_input = TRUE}, \code{susie_ss} performs additional checks on \code{XtX} and \code{Xty}. The checks are: (1) check that \code{XtX} is positive semidefinite; (2) check that \code{Xty} is in the space spanned by the non-zero eigenvectors of \code{XtX}.} \item{check_prior}{If \code{check_prior = TRUE}, it checks if the estimated prior variance becomes unreasonably large (comparing with 10 * max(abs(z))^2).} \item{n_purity}{Passed as argument \code{n_purity} to \code{\link{susie_get_cs}}.} \item{r_tol}{Tolerance level for eigenvalue check of positive semidefinite matrix \code{XtX}.} \item{refine}{If \code{refine = TRUE}, then an additional iterative refinement procedure is used, after the IBSS algorithm, to check and escape from local optima (see details).} \item{R_finite}{Controls variance inflation to account for estimating the R matrix from a finite reference panel. 
Accepts three types of input: \describe{ \item{\code{NULL} (default)}{The R matrix is treated as trusted, and no finite-reference variance inflation is applied.} \item{\code{TRUE}}{Infer the reference sample size B from the input \code{X}. Sets \code{B = nrow(X)} for single-panel input, or \code{B = min(nrow(X_k))} across panels for multi-panel input. Requires \code{X} to be provided (errors if only \code{R} is given, since B cannot be inferred).} \item{Number}{Explicit reference sample size B.} } When active, this dynamically inflates the null variance of each variable's score statistic at every IBSS iteration to account for finite-reference uncertainty in the Single Effect Regression (SER). When provided, the output includes a \code{R_finite_diagnostics} element with per-region and per-variable quality metrics.} \item{R_mismatch}{R-bias correction mode. \code{"none"} (default) is off. \code{"map"} adds a region-level population-mismatch variance component on top of the finite-reference correction; recommended whenever \code{R} comes from a different cohort than the GWAS. \code{"map_qc"} is \code{"map"} plus a QC score (\code{Q_art}) that warns when the fitted residual carries energy in directions where the supplied \code{R} indicates signal should be weak. For allele-coding / strand-flip checks, see the kriging diagnostic in \code{susie_rss}'s companion utilities. Requires \code{R_finite}; auto-disables \code{estimate_residual_variance} with a warning.} \item{eig_delta_rel, eig_delta_abs}{Cutoffs for "low-eigenvalue" directions of \code{R} used by the QC diagnostic (\code{R_mismatch = "map_qc"}). Default \code{eig_delta_rel = 1e-3}, \code{eig_delta_abs = 0}; the threshold is \code{max(eig_delta_abs, eig_delta_rel * max_eigenvalue(R))}. Tighter (smaller) values flag fewer regions.} \item{artifact_threshold}{Flag threshold on the QC score \code{Q_art} (a fraction in [0, 1]). Default \code{0.1}; flag fires when \code{Q_art > artifact_threshold}. 
Heuristic, not a calibrated test.} \item{alpha0}{Numerical parameter for the NIG prior when using \code{estimate_residual_method = "NIG"}. Defaults to \code{1/sqrt(n)}, where \code{n} is the sample size. When calling \code{susie_rss} with NIG, \code{n} must be supplied; otherwise validation errors.} \item{beta0}{Numerical parameter for the NIG prior when using \code{estimate_residual_method = "NIG"}. Defaults to \code{1/sqrt(n)}, where \code{n} is the sample size. When calling \code{susie_rss} with NIG, \code{n} must be supplied; otherwise validation errors.} \item{init_only}{Logical. If \code{TRUE}, return a list with \code{data} and \code{params} objects without running the IBSS algorithm. Default is \code{FALSE}.} \item{slot_prior}{Optional slot activity prior created by \code{\link{slot_prior_betabinom}} or \code{\link{slot_prior_poisson}}. Use \code{slot_prior_betabinom(a_beta, b_beta)} for the usual single-locus setting; it places a Beta-Binomial prior on the number of active effects and gives an adaptive multiplicity correction. Use \code{slot_prior_poisson(C, nu)} when you want a Gamma-Poisson prior centered on an expected number \code{C} of active effects. 
When supplied, each single-effect slot has an estimated activity probability \code{c_hat}; fitted values and PIPs are weighted by these activity probabilities, and convergence is checked using \code{convergence_method = "pip"}.} } \value{ In addition to the standard \code{"susie"} output (see \code{\link{susie}}), the returned object may contain: \item{R_finite_diagnostics}{A list of diagnostics for the finite-reference correction (only present when \code{R_finite} is provided), containing: \code{B} (the reference sample size); \code{p} (number of variables); \code{effective_rank} (debiased \eqn{\tilde{r} = p^2 / \|R\|_F^2}); \code{r_over_B} (\eqn{\tilde{r}/B}, one number per region; values \eqn{\le 0.2} indicate the reference panel is adequate); \code{Rhat_diag_deviation} (\eqn{|\hat{R}_{jj} - 1|}, one number per variable); \code{lambda_bias} (region-level scalar on the default \code{lambda = 0} sufficient-statistics path when \code{R_mismatch != "none"}); \code{B_corrected} (effective reference sample size after the R-bias correction, \eqn{1/(1/B + \lambda_{\mathrm{bias}})}; substantially smaller than the input \code{B} flags a dominant population mismatch component); \code{per_variable_penalty} (final-iteration \eqn{v_j / \sigma^2 = \tau_j^2 / \sigma^2 - 1}, one number per variable; values \eqn{\le 0.2} indicate minimal power loss, values \eqn{\gg 1} flag variables where the correction is doing heavy lifting).} } \description{ Performs SuSiE regression using z-scores and correlation matrix. This is the sufficient-statistics RSS interface. For the specialized regularized eigendecomposition likelihood with \code{lambda > 0}, use \code{\link{susie_rss_lambda}}. 
} ================================================ FILE: man/susie_rss_lambda.Rd ================================================ % Generated by roxygen2: do not edit by hand % Please edit documentation in R/susie.R \name{susie_rss_lambda} \alias{susie_rss_lambda} \title{Sum of Single Effects Regression using the RSS-lambda likelihood} \usage{ susie_rss_lambda( z = NULL, R = NULL, n = NULL, X = NULL, L = min(10, if (!is.null(R)) ncol(R) else ncol(X)), lambda, maf = NULL, maf_thresh = 0, prior_variance = 50, residual_variance = NULL, prior_weights = NULL, null_weight = 0, intercept_value = 0, estimate_residual_variance = FALSE, estimate_residual_method = "MLE", estimate_prior_variance = TRUE, estimate_prior_method = c("optim", "EM", "simple"), prior_variance_grid = NULL, mixture_weights = NULL, check_null_threshold = 0, prior_tol = 1e-09, residual_variance_lowerbound = 0, model_init = NULL, coverage = 0.95, min_abs_corr = 0.5, max_iter = 100, L_greedy = NULL, greedy_lbf_cutoff = 0.1, tol = 1e-04, convergence_method = c("elbo", "pip"), verbose = FALSE, track_fit = FALSE, check_prior = TRUE, check_R = TRUE, check_z = FALSE, n_purity = 100, r_tol = 1e-08, refine = FALSE, init_only = FALSE, slot_prior = NULL ) } \arguments{ \item{z}{A p-vector of z-scores.} \item{R}{A p by p correlation matrix. Exactly one of \code{R} or \code{X} must be provided.} \item{n}{The sample size, not required but recommended.} \item{X}{A factor matrix (B x p) such that \code{R = crossprod(X) / nrow(X)} approximates the R (correlation) matrix. When \code{nrow(X) >= ncol(X)}, the correlation matrix \code{R} is formed explicitly and the standard path is used. When \code{nrow(X) < ncol(X)}, a low-rank path is used that avoids forming the p x p matrix, reducing per-iteration cost from O(Lp^2) to O(LBp). Columns of \code{X} are standardized internally.} \item{L}{Maximum number of non-zero effects in the model. 
If L is larger than the number of covariates, p, L is set to p.} \item{lambda}{Regularization parameter for the RSS-lambda likelihood. Must be supplied. \code{lambda = "estimate"} estimates lambda from the null-space residual.} \item{maf}{A p-vector of minor allele frequencies; to be used along with \code{maf_thresh} to filter input summary statistics.} \item{maf_thresh}{Variants with MAF smaller than this threshold are not used.} \item{prior_variance}{Prior variance for each non-zero effect on the z-score scale. Replaces \code{scaled_prior_variance} from \code{\link{susie_rss}}. Default \code{50}.} \item{residual_variance}{Variance of the residual. If \code{estimate_residual_variance = TRUE}, this value provides the initial estimate of the residual variance. By default, it is set to \code{var(y)} in \code{susie} and \code{(1/(n-1))yty} in \code{susie_ss}.} \item{prior_weights}{A vector of length p, in which each entry gives the prior probability that corresponding column of X has a nonzero effect on the outcome, y. The weights are internally normalized to sum to 1. When \code{NULL} (the default), uniform prior weights are used (each variable is assigned probability \code{1/p}).} \item{null_weight}{Prior probability of no effect (a number between 0 and 1, and cannot be exactly 1).} \item{intercept_value}{Intercept used by the RSS-lambda likelihood. Default \code{0}.} \item{estimate_residual_variance}{The default is FALSE, the residual variance is fixed to 1 or variance of y. If the in-sample R matrix is provided, we recommend setting \code{estimate_residual_variance = TRUE}.} \item{estimate_residual_method}{Variance-component estimator. The RSS-lambda path supports \code{"MLE"} only; any other value errors.} \item{estimate_prior_variance}{If \code{estimate_prior_variance = TRUE}, the prior variance is estimated (a separate parameter for each of the L effects). 
When \code{TRUE}, \code{prior_variance} provides the initial value; when \code{FALSE}, it is held fixed.} \item{estimate_prior_method}{The method used for estimating prior variance. When \code{estimate_prior_method = "simple"} is used, the likelihood at the specified prior variance is compared to the likelihood at a variance of zero, and the setting with the larger likelihood is retained. When \code{prior_variance_grid} is provided, this is automatically set to \code{"fixed_mixture"}.} \item{prior_variance_grid}{Numeric vector of K prior variances defining a mixture-of-normals prior on effect sizes. When provided, the SER evaluates Bayes factors at each grid point and forms a mixture BF weighted by \code{mixture_weights}. This bypasses the scalar prior variance optimization. Default is \code{NULL} (standard scalar V path).} \item{mixture_weights}{Numeric vector of K non-negative weights summing to 1, giving the mixture proportions for the variance grid. Default is \code{NULL}, which uses uniform weights when \code{prior_variance_grid} is provided.} \item{check_null_threshold}{When the prior variance is estimated, compare its likelihood to the likelihood at zero and use zero unless the larger value exceeds it by at least \code{check_null_threshold}. \code{0} (default) takes the larger likelihood at face value.} \item{prior_tol}{When the prior variance is estimated, compare the estimated value to \code{prior_tol} at the end of the computation, and exclude a single effect from PIP computation if the estimated prior variance is smaller than this tolerance value.} \item{residual_variance_lowerbound}{Lower limit on the estimated residual variance. It is only relevant when \code{estimate_residual_variance = TRUE}.} \item{model_init}{A previous susie fit with which to initialize.} \item{coverage}{A number between 0 and 1 specifying the \dQuote{coverage} of the estimated confidence sets.} \item{min_abs_corr}{Minimum absolute correlation allowed in a credible set. 
The default, 0.5, corresponds to a squared correlation of 0.25, which is a commonly used threshold for genotype data in genetic studies. This "purity" filter is applied to the CSs reported in the fit object, so the CS list returned here may be a subset of the one produced by calling \code{\link{susie_get_cs}} on the same fit without passing \code{X} or \code{Xcorr} (in which case the purity filter is skipped).} \item{max_iter}{Maximum number of IBSS iterations to perform.} \item{L_greedy}{Integer or \code{NULL}. When non-\code{NULL}, run a greedy outer loop that grows the number of effects from \code{L_greedy} up to \code{L} in linear steps until the fit saturates. The default \code{NULL} runs the usual fixed-\code{L} fit.} \item{greedy_lbf_cutoff}{Numeric saturation threshold for the \code{L_greedy} outer loop. Default is 0.1.} \item{tol}{A small, non-negative number specifying the convergence tolerance for the IBSS fitting procedure.} \item{convergence_method}{When \code{convergence_method = "elbo"} the fitting procedure halts when the difference in the variational lower bound, or \dQuote{ELBO} (the objective function to be maximized), is less than \code{tol}. 
When \code{convergence_method = "pip"} the fitting procedure halts when the maximum absolute difference in \code{alpha} is less than \code{tol}.} \item{verbose}{If \code{verbose = TRUE}, the algorithm's progress, a summary of the optimization settings, and refinement progress (if \code{refine = TRUE}) are printed to the console.} \item{track_fit}{If \code{track_fit = TRUE}, \code{trace} is also returned containing detailed information about the estimates at each iteration of the IBSS fitting procedure.} \item{check_prior}{If \code{check_prior = TRUE}, it checks if the estimated prior variance becomes unreasonably large (comparing with 10 * max(abs(z))^2).} \item{check_R}{If TRUE, verify that \code{R} is positive semidefinite.} \item{check_z}{If TRUE, verify that \code{z} lies in the column space of \code{R}.} \item{n_purity}{Passed as argument \code{n_purity} to \code{\link{susie_get_cs}}.} \item{r_tol}{Tolerance level for eigenvalue check of positive semidefinite matrix \code{XtX}.} \item{refine}{If \code{refine = TRUE}, then an additional iterative refinement procedure is used, after the IBSS algorithm, to check and escape from local optima (see details).} \item{init_only}{Logical. If \code{TRUE}, return a list with \code{data} and \code{params} objects without running the IBSS algorithm. Default is \code{FALSE}.} \item{slot_prior}{Optional slot activity prior created by \code{\link{slot_prior_betabinom}} or \code{\link{slot_prior_poisson}}. Use \code{slot_prior_betabinom(a_beta, b_beta)} for the usual single-locus setting; it places a Beta-Binomial prior on the number of active effects and gives an adaptive multiplicity correction. Use \code{slot_prior_poisson(C, nu)} when you want a Gamma-Poisson prior centered on an expected number \code{C} of active effects. 
When supplied, each single-effect slot has an estimated activity probability \code{c_hat}; fitted values and PIPs are weighted by these activity probabilities, and convergence is checked using \code{convergence_method = "pip"}.} } \value{ A \code{"susie"} fit (or, with \code{init_only = TRUE}, the constructed data and params objects). } \description{ Specialized interface for the regularized eigendecomposition RSS likelihood of Zou et al. (2022). This path accepts a single reference matrix or a single factor matrix and does not support multi-panel mixture, finite-reference inflation, or R-bias correction. } ================================================ FILE: man/susie_ss.Rd ================================================ % Generated by roxygen2: do not edit by hand % Please edit documentation in R/susie.R \name{susie_ss} \alias{susie_ss} \title{SuSiE using Sufficient Statistics} \usage{ susie_ss( XtX, Xty, yty, n, L = min(10, ncol(XtX)), X_colmeans = NA, y_mean = NA, maf = NULL, maf_thresh = 0, check_input = FALSE, r_tol = 1e-08, standardize = TRUE, scaled_prior_variance = 0.2, residual_variance = NULL, prior_weights = NULL, null_weight = 0, model_init = NULL, s_init = NULL, estimate_residual_variance = TRUE, estimate_residual_method = c("MoM", "MLE", "NIG"), residual_variance_lowerbound = 0, residual_variance_upperbound = Inf, estimate_prior_variance = TRUE, estimate_prior_method = c("optim", "EM", "simple"), prior_variance_grid = NULL, mixture_weights = NULL, unmappable_effects = c("none", "inf", "ash", "ash_filter_archived"), check_null_threshold = 0, prior_tol = 1e-09, max_iter = 100, L_greedy = NULL, greedy_lbf_cutoff = 0.1, tol = 1e-04, convergence_method = c("elbo", "pip"), coverage = 0.95, min_abs_corr = 0.5, n_purity = 100, verbose = FALSE, track_fit = FALSE, check_prior = FALSE, refine = FALSE, alpha0 = 1/sqrt(n), beta0 = 1/sqrt(n), slot_prior = NULL ) } \arguments{ \item{XtX}{A p by p matrix, X'X, with columns of X centered to have mean zero.} 
\item{Xty}{A p-vector, X'y, with y and columns of X centered to have mean zero.} \item{yty}{A scalar, y'y, with y centered to have mean zero.} \item{n}{The sample size.} \item{L}{Maximum number of non-zero effects in the model. If L is larger than the number of covariates, p, L is set to p.} \item{X_colmeans}{A p-vector of column means of \code{X}. If both \code{X_colmeans} and \code{y_mean} are provided, the intercept is estimated; otherwise, the intercept is NA.} \item{y_mean}{A scalar containing the mean of \code{y}. If both \code{X_colmeans} and \code{y_mean} are provided, the intercept is estimated; otherwise, the intercept is NA.} \item{maf}{A p-vector of minor allele frequencies; to be used along with \code{maf_thresh} to filter input summary statistics.} \item{maf_thresh}{Variants with MAF smaller than this threshold are not used.} \item{check_input}{If \code{check_input = TRUE}, \code{susie_ss} performs additional checks on \code{XtX} and \code{Xty}. The checks are: (1) check that \code{XtX} is positive semidefinite; (2) check that \code{Xty} is in the space spanned by the non-zero eigenvectors of \code{XtX}.} \item{r_tol}{Tolerance level for eigenvalue check of positive semidefinite matrix \code{XtX}.} \item{standardize}{If \code{standardize = TRUE}, standardize the columns of X to unit variance prior to fitting (or equivalently standardize XtX and Xty to have the same effect). Note that \code{scaled_prior_variance} specifies the prior on the coefficients of X \emph{after} standardization (if it is performed). If you do not standardize, you may need to think more carefully about specifying \code{scaled_prior_variance}. Whatever your choice, the coefficients returned by \code{coef} are given for \code{X} on the original input scale. 
Any column of \code{X} that has zero variance is not standardized.} \item{scaled_prior_variance}{The prior variance, divided by \code{var(y)} (or by \code{(1/(n-1))yty} for \code{susie_ss}); that is, the prior variance of each non-zero element of b is \code{var(y) * scaled_prior_variance}. The value provided should be either a scalar or a vector of length \code{L}. If \code{estimate_prior_variance = TRUE}, this provides initial estimates of the prior variances.} \item{residual_variance}{Variance of the residual. If \code{estimate_residual_variance = TRUE}, this value provides the initial estimate of the residual variance. By default, it is set to \code{var(y)} in \code{susie} and \code{(1/(n-1))yty} in \code{susie_ss}.} \item{prior_weights}{A vector of length p, in which each entry gives the prior probability that corresponding column of X has a nonzero effect on the outcome, y. The weights are internally normalized to sum to 1. When \code{NULL} (the default), uniform prior weights are used (each variable is assigned probability \code{1/p}).} \item{null_weight}{Prior probability of no effect (a number between 0 and 1, and cannot be exactly 1).} \item{model_init}{A previous susie fit with which to initialize.} \item{s_init}{Deprecated alias for \code{model_init}.} \item{estimate_residual_variance}{If \code{estimate_residual_variance = TRUE}, the residual variance is estimated, using \code{residual_variance} as an initial value. If \code{estimate_residual_variance = FALSE}, the residual variance is fixed to the value supplied by \code{residual_variance}.} \item{estimate_residual_method}{The method used for estimating residual variance. For the original SuSiE model, "MLE" and "MoM" estimation is equivalent, but for the infinitesimal model, "MoM" is more stable. 
We recommend using "NIG" when n < 80 for improved coverage, although it is currently only implemented for individual-level data.} \item{residual_variance_lowerbound}{Lower limit on the estimated residual variance. It is only relevant when \code{estimate_residual_variance = TRUE}.} \item{residual_variance_upperbound}{Upper limit on the estimated residual variance. It is only relevant when \code{estimate_residual_variance = TRUE}.} \item{estimate_prior_variance}{If \code{estimate_prior_variance = TRUE}, the prior variance is estimated (this is a separate parameter for each of the L effects). If provided, \code{scaled_prior_variance} is then used as an initial value for the optimization. When \code{estimate_prior_variance = FALSE}, the prior variance for each of the L effects is determined by the value supplied to \code{scaled_prior_variance}.} \item{estimate_prior_method}{The method used for estimating prior variance. When \code{estimate_prior_method = "simple"} is used, the likelihood at the specified prior variance is compared to the likelihood at a variance of zero, and the setting with the larger likelihood is retained. When \code{prior_variance_grid} is provided, this is automatically set to \code{"fixed_mixture"}.} \item{prior_variance_grid}{Numeric vector of K prior variances defining a mixture-of-normals prior on effect sizes. When provided, the SER evaluates Bayes factors at each grid point and forms a mixture BF weighted by \code{mixture_weights}. This bypasses the scalar prior variance optimization. Default is \code{NULL} (standard scalar V path).} \item{mixture_weights}{Numeric vector of K non-negative weights summing to 1, giving the mixture proportions for the variance grid. 
Default is \code{NULL}, which uses uniform weights when
\code{prior_variance_grid} is provided.}

\item{unmappable_effects}{The method for modeling unmappable effects:
"none", "inf", "ash".}

\item{check_null_threshold}{When the prior variance is estimated, compare
the estimate with the null, and set the prior variance to zero unless the
log-likelihood using the estimate is larger by this threshold amount. For
example, if you set \code{check_null_threshold = 0.1}, this will "nudge"
the estimate towards zero when the difference in log-likelihoods is small.
A note of caution that setting this to a value greater than zero may lead
the IBSS fitting procedure to occasionally decrease the ELBO. This setting
is disabled when using \code{unmappable_effects = "inf"} or
\code{unmappable_effects = "ash"}.}

\item{prior_tol}{When the prior variance is estimated, compare the
estimated value to \code{prior_tol} at the end of the computation, and
exclude a single effect from PIP computation if the estimated prior
variance is smaller than this tolerance value.}

\item{max_iter}{Maximum number of IBSS iterations to perform.}

\item{L_greedy}{Integer or \code{NULL}. When non-\code{NULL}, run a greedy
outer loop that grows the number of effects from \code{L_greedy} up to
\code{L} in linear steps until the fit saturates. The default \code{NULL}
runs the usual fixed-\code{L} fit.}

\item{greedy_lbf_cutoff}{Numeric saturation threshold for the
\code{L_greedy} outer loop. Default is 0.1.}

\item{tol}{A small, non-negative number specifying the convergence
tolerance for the IBSS fitting procedure.}

\item{convergence_method}{When \code{convergence_method = "elbo"} the
fitting procedure halts when the difference in the variational lower
bound, or \dQuote{ELBO} (the objective function to be maximized), is less
than \code{tol}.
When \code{convergence_method = "pip"} the fitting procedure halts when the
maximum absolute difference in \code{alpha} is less than \code{tol}.}

\item{coverage}{A number between 0 and 1 specifying the \dQuote{coverage}
of the estimated confidence sets.}

\item{min_abs_corr}{Minimum absolute correlation allowed in a credible
set. The default, 0.5, corresponds to a squared correlation of 0.25,
which is a commonly used threshold for genotype data in genetic studies.
This "purity" filter is applied to the CSs reported in the fit object, so
the CS list returned here may be a subset of the one produced by calling
\code{\link{susie_get_cs}} on the same fit without passing \code{X} or
\code{Xcorr} (in which case the purity filter is skipped).}

\item{n_purity}{Passed as argument \code{n_purity} to
\code{\link{susie_get_cs}}.}

\item{verbose}{If \code{verbose = TRUE}, the algorithm's progress, a
summary of the optimization settings, and refinement progress (if
\code{refine = TRUE}) are printed to the console.}

\item{track_fit}{If \code{track_fit = TRUE}, \code{trace} is also
returned containing detailed information about the estimates at each
iteration of the IBSS fitting procedure.}

\item{check_prior}{If \code{check_prior = TRUE}, it checks if the
estimated prior variance becomes unreasonably large (comparing with
10 * max(abs(z))^2).}

\item{refine}{If \code{refine = TRUE}, then an additional iterative
refinement procedure is used, after the IBSS algorithm, to check and
escape from local optima (see details).}

\item{alpha0}{Numerical parameter for the NIG prior when using
\code{estimate_residual_method = "NIG"}. Defaults to \code{1/sqrt(n)},
where \code{n} is the sample size. When calling \code{susie_rss} with
NIG, \code{n} must be supplied; otherwise validation errors.}

\item{beta0}{Numerical parameter for the NIG prior when using
\code{estimate_residual_method = "NIG"}. Defaults to \code{1/sqrt(n)},
where \code{n} is the sample size.
When calling \code{susie_rss} with NIG, \code{n} must be supplied; otherwise validation errors.} \item{slot_prior}{Optional slot activity prior created by \code{\link{slot_prior_betabinom}} or \code{\link{slot_prior_poisson}}. Use \code{slot_prior_betabinom(a_beta, b_beta)} for the usual single-locus setting; it places a Beta-Binomial prior on the number of active effects and gives an adaptive multiplicity correction. Use \code{slot_prior_poisson(C, nu)} when you want a Gamma-Poisson prior centered on an expected number \code{C} of active effects. When supplied, each single-effect slot has an estimated activity probability \code{c_hat}; fitted values and PIPs are weighted by these activity probabilities, and convergence is checked using \code{convergence_method = "pip"}.} } \description{ Performs SuSiE regression using sufficient statistics (XtX, Xty, yty, n) instead of individual-level data (X, y). } ================================================ FILE: man/susie_trendfilter.Rd ================================================ % Generated by roxygen2: do not edit by hand % Please edit documentation in R/susie_trendfilter.R \name{susie_trendfilter} \alias{susie_trendfilter} \title{Apply susie to trend filtering (especially changepoint problems), a type of non-parametric regression.} \usage{ susie_trendfilter(y, order = 0, standardize = FALSE, use_mad = TRUE, ...) } \arguments{ \item{y}{An n-vector of observations ordered in time or space (assumed to be equally spaced).} \item{order}{An integer specifying the order of trend filtering. The default, \code{order = 0}, corresponds to "changepoint" problems (\emph{i.e.}, piecewise constant \eqn{mu}). 
Although \code{order > 0} is implemented, we do not recommend its use; in practice, we have found problems with convergence of the algorithm to poor local optima, producing unreliable inferences.} \item{standardize}{Logical indicating whether to standardize the X variables ("basis functions"); \code{standardize = FALSE} is recommended as these basis functions already have a natural scale.} \item{use_mad}{Logical indicating whether to use the "median absolute deviation" (MAD) method to the estimate residual variance. If \code{use_mad = TRUE}, susie is run twice, first by fixing the residual variance to the MAD value, then a second time, initialized to the first fit, but with residual variance estimated the usual way (by maximizing the ELBO). We have found this strategy typically improves reliability of the results by reducing a tendency to converge to poor local optima of the ELBO.} \item{...}{Other arguments passed to \code{\link{susie}}.} } \value{ A "susie" fit; see \code{\link{susie}} for details. } \description{ Fits the non-parametric Gaussian regression model \eqn{y = mu + e}, where the mean \eqn{mu} is modelled as \eqn{mu = Xb}, X is a matrix with columns containing an appropriate basis, and b is vector with a (sparse) SuSiE prior. In particular, when \code{order = 0}, the jth column of X is a vector with the first j elements equal to zero, and the remaining elements equal to 1, so that \eqn{b_j} corresponds to the change in the mean of y between indices j and j+1. For background on trend filtering, see Tibshirani (2014). See also the "Trend filtering" vignette, \code{vignette("trend_filtering")}. } \details{ This implementation exploits the special structure of X, which means that the matrix-vector product \eqn{X^Ty} is fast to compute; in particular, the computation time is \eqn{O(n)} rather than \eqn{O(n^2)} if \code{X} were formed explicitly. 
For implementation details, see the "Implementation of SuSiE trend filtering" vignette by running \code{vignette("trendfiltering_derivations")}. } \examples{ set.seed(1) mu <- c(rep(0, 50), rep(1, 50), rep(3, 50), rep(-2, 50), rep(0, 200)) y <- mu + rnorm(400) s <- susie_trendfilter(y) plot(y) lines(mu, col = 1, lwd = 3) lines(predict(s), col = 2, lwd = 2) # Calculate credible sets (indices of y that occur just before # changepoints). susie_get_cs(s) # Plot with credible sets for changepoints. susie_plot_changepoint(s, y) } \references{ R. J. Tibshirani (2014). Adaptive piecewise polynomial estimation via trend filtering. \emph{Annals of Statistics} \bold{42}, 285-323. } ================================================ FILE: man/susie_workhorse.Rd ================================================ % Generated by roxygen2: do not edit by hand % Please edit documentation in R/susie_workhorse.R \name{susie_workhorse} \alias{susie_workhorse} \title{SuSiE workhorse function} \usage{ susie_workhorse(data, params) } \arguments{ \item{data}{Data object (individual, ss, or rss_lambda).} \item{params}{Validated params object.} } \value{ Complete fitted SuSiE model. } \description{ Main orchestration for the IBSS algorithm. When `params$L_greedy` is non-NULL, runs a greedy outer loop that grows `L` in linear steps of `params$L_greedy` until the fit has at least one empty slot (`min(lbf) < params$greedy_lbf_cutoff`, default `0.1`) or `L` reaches `params$L`. With `params$L_greedy = NULL` (default), runs a single fixed-`L` IBSS, output bit-identical to prior susieR. } \keyword{internal} ================================================ FILE: man/univar.order.Rd ================================================ % Generated by roxygen2: do not edit by hand % Please edit documentation in R/univariate_regression.R \name{univar.order} \alias{univar.order} \title{Ordering of Predictors from Univariate Regression} \usage{ univar.order(X, y) } \arguments{ \item{X}{An input design matrix. 
This may be centered and/or standardized prior to calling this function.}

\item{y}{A vector of response variables.}
}
\value{
An ordering of the predictors.
}
\description{
This function extracts the ordering of the predictors according to the
coefficients estimated in a basic univariate regression; in particular,
the predictors are ordered in decreasing order by magnitude of the
univariate regression coefficient estimate.
}
\examples{
### generate synthetic data
set.seed(1)
n = 200
p = 300
X = matrix(rnorm(n*p),n,p)
beta = double(p)
beta[1:10] = 1:10
y = X \%*\% beta + rnorm(n)
univ.order = univar.order(X,y)
}


================================================
FILE: man/univariate_regression.Rd
================================================
% Generated by roxygen2: do not edit by hand
% Please edit documentation in R/univariate_regression.R
\name{univariate_regression}
\alias{univariate_regression}
\alias{calc_z}
\title{Perform Univariate Linear Regression Separately for Columns of X}
\usage{
univariate_regression(
  X,
  y,
  Z = NULL,
  center = TRUE,
  scale = FALSE,
  return_residuals = FALSE,
  method = c("lmfit", "sumstats")
)

calc_z(X, Y, center = FALSE, scale = FALSE)
}
\arguments{
\item{X}{n by p matrix of regressors.}

\item{y}{n-vector of response variables.}

\item{Z}{Optional n by k matrix of covariates to be included in all
regressions. If Z is not \code{NULL}, the linear effects of covariates
are removed from y first, and the resulting residuals are used in place
of y.}

\item{center}{If \code{center = TRUE}, center X, y and Z.}

\item{scale}{If \code{scale = TRUE}, scale X, y and Z.}

\item{return_residuals}{Whether or not to output the residuals if Z is
not \code{NULL}.}

\item{method}{Either \dQuote{sumstats} (faster implementation) or
\dQuote{lmfit} (uses \code{\link[stats]{.lm.fit}}).}
}
\value{
A list with two vectors containing the least-squares estimates of the
coefficients (\code{betahat}) and their standard errors
(\code{sebetahat}).
Optionally, and only when a matrix of covariates \code{Z} is provided, a
third vector \code{residuals} containing the residuals is returned.
}
\description{
This function performs the univariate linear regression y ~ x separately
for each column x of X. The estimated effect size and standard error for
each variable are returned.
}
\examples{
set.seed(1)
n = 1000
p = 1000
beta = rep(0,p)
beta[1:4] = 1
X = matrix(rnorm(n*p),nrow = n,ncol = p)
X = scale(X,center = TRUE,scale = TRUE)
y = drop(X \%*\% beta + rnorm(n))
res = univariate_regression(X,y)
plot(res$betahat/res$sebetahat)
}


================================================
FILE: man/unmappable_data.Rd
================================================
% Generated by roxygen2: do not edit by hand
% Please edit documentation in R/example_dataset.R
\docType{data}
\name{unmappable_data}
\alias{unmappable_data}
\title{Simulated Fine-mapping Data with Sparse, Oligogenic and Polygenic
Effects.}
\format{
\code{unmappable_data} is a list with the following elements:

\describe{
\item{X}{Centered and scaled genotype matrix.}
\item{y}{Simulated response.}
\item{beta}{Simulated effect sizes.}
\item{h2g}{Total proportion of variance in the response explained by the
simulated effects.}}
}
\description{
A simulated data set with 1,000 individuals and 5,000 variants, combining
3 sparse, 5 oligogenic and 15 polygenic non-zero effects. The response is
generated under a linear regression model. This data set illustrates
fine-mapping with SuSiE-ash and SuSiE-inf.
}
\examples{
data(unmappable_data)
}
\seealso{
The \dQuote{Fine-mapping with SuSiE-ash and SuSiE-inf} vignette.
} \keyword{data} ================================================ FILE: pixi.toml ================================================ [workspace] name = "r-susier" channels = ["dnachun", "conda-forge", "bioconda"] platforms = ["linux-64", "osx-arm64"] [system-requirements] libc = { family="glibc", version="2.17" } [tasks] devtools_document = "cd $GITHUB_WORKSPACE; R -e 'devtools::document()'" devtools_test = "cd $GITHUB_WORKSPACE; R -e 'devtools::test()'" codecov = "cd $GITHUB_WORKSPACE; R -e 'covr::codecov(quiet = FALSE)'" build = "cd $GITHUB_WORKSPACE; R -e 'devtools::build(vignettes = TRUE)'" rcmdcheck = "cd $GITHUB_WORKSPACE; R -e 'pkg <- list.files(\"..\", pattern = \".tar.gz\", full.names = TRUE); rcmdcheck::rcmdcheck(path = pkg[1], args = c(\"--as-cran\", \"--no-manual\"))'" use_major_version = "cd $GITHUB_WORKSPACE; R -e 'usethis::use_version(which = \"major\", push = FALSE)'" use_minor_version = "cd $GITHUB_WORKSPACE; R -e 'usethis::use_version(which = \"minor\", push = FALSE)'" use_patch_version = "cd $GITHUB_WORKSPACE; R -e 'usethis::use_version(which = \"patch\", push = FALSE)'" pkgdown_build = "cd $GITHUB_WORKSPACE; R -e 'pkgdown::build_site_github_pages(new_process = FALSE, install = TRUE)'" [feature.r44] dependencies = {"r-base" = "4.4.*"} [feature.r45] dependencies = {"r-base" = "4.5.*"} [environments] r44 = {features = ["r44"]} r45 = {features = ["r45"]} [target.linux-64.dependencies] "gcc" = "*" [dependencies] # Core dependencies (from Imports / LinkingTo) "r-cpp11" = "*" "r-cpp11armadillo" = "*" "r-matrix" = "*" "r-matrixstats" = "*" "r-mixsqp" = "*" "r-reshape" = "*" "r-crayon" = "*" "r-ggplot2" = "*" "r-l0learn" = "*" "r-survival" = "*" # Suggested dependencies (for testing and documentation) "r-curl" = "*" "r-testthat" = "*" "r-microbenchmark" = "*" "r-knitr" = "*" "r-rmarkdown" = "*" "r-rfast" = "*" "r-cowplot" = "*" # Development tools (optional, but useful for package development) "r-devtools" = "*" "r-covr" = "*" "r-rcmdcheck" = "*" 
"r-pkgdown" = "*" "r-decor" = "*" # required by cpp11::cpp_register() during devtools::document() "qpdf" = "*" ================================================ FILE: src/Makevars ================================================ PKG_CXXFLAGS = $(SHLIB_OPENMP_CXXFLAGS) PKG_LIBS = $(SHLIB_OPENMP_CXXFLAGS) $(LAPACK_LIBS) $(BLAS_LIBS) $(FLIBS) ================================================ FILE: src/Makevars.win ================================================ PKG_CXXFLAGS = $(SHLIB_OPENMP_CXXFLAGS) PKG_LIBS = $(SHLIB_OPENMP_CXXFLAGS) $(LAPACK_LIBS) $(BLAS_LIBS) $(FLIBS) ================================================ FILE: src/caisa.cpp ================================================ #include #include #include "mr_ash.h" using namespace cpp11; using namespace arma; // Random permutation index vector of length p * numiter (0-based). [[cpp11::register]] integers random_order(int p, int numiter) { return as_integers(random_order_impl(p, numiter)); } // Mr.ASH coordinate-ascent in sufficient-statistic form. [[cpp11::register]] writable::list caisa_cpp(const doubles_matrix<>& X, const doubles& w, const doubles& sa2, const doubles& pi_init, const doubles& beta_init, const doubles& r_init, double sigma2, const integers& o_r, int maxiter, int miniter, double convtol, double epstol, std::string method_q, bool updatepi, bool updatesigma, bool verbose) { // cpp11 inputs -> Armadillo. pi, beta, r are mutated -> own their memory. const mat X_mat = as_Mat(X); const vec w_vec = as_Col(w); const vec sa2_vec = as_Col(sa2); const uvec o = as_uvec(o_r); vec pi = conv_to::from(as_Col(pi_init)); vec beta = conv_to::from(as_Col(beta_init)); vec r = conv_to::from(as_Col(r_init)); const int n = X_mat.n_rows; const int p = X_mat.n_cols; const int K = sa2_vec.n_elem; // Per-iter per-coordinate prior weights (mixture precision + X*X'/sigma2). 
  // S2inv(k, j) = 1 / (1/sa2[k] + w[j]); row 0 (null component) is pinned to
  // epstol so the null's posterior mean contribution stays negligible.
  mat S2inv = 1.0 / outerAddition(1.0 / sa2_vec, w_vec);
  S2inv.row(0).fill(epstol);
  vec varobj(maxiter);
  vec piold, betaold;
  int iter = 0;
  int i = 0; // running index into the precomputed order o (length p*maxiter)
  for (iter = 0; iter < maxiter; iter++) {
    double a1 = 0.0, a2 = 0.0; // M-step accumulators filled by updatebetaj
    piold = pi;
    betaold = beta;
    pi.fill(0); // rebuilt incrementally during the sweep
    // Coordinate-ascent sweep (random order given by o)
    for (int j = 0; j < p; j++) {
      updatebetaj(X_mat.col(o(i)), w_vec(o(i)), beta(o(i)), r, piold, pi,
                  sigma2, sa2_vec, S2inv.col(o(i)), a1, a2, o(i), p, epstol);
      i++;
    }
    // Variational objective (first term)
    varobj(iter) = dot(r, r) - dot(square(beta), w_vec) + a1;
    // Optionally update sigma2
    if (updatesigma) {
      if (method_q == "sigma_indep_q") {
        sigma2 = (varobj(iter) + p * (1.0 - pi(0)) * sigma2) /
                 (n + p * (1.0 - pi(0)));
      } else if (method_q == "sigma_dep_q") {
        sigma2 = varobj(iter) / n;
      }
    }
    // Freeze piold for objective computation when updating pi
    if (updatepi)
      piold = pi;
    // Variational objective (full expression)
    varobj(iter) = varobj(iter) / sigma2 / 2.0 +
                   log(2.0 * M_PI * sigma2) / 2.0 * n -
                   dot(pi, log(piold + epstol)) * p + a2;
    for (int j = 1; j < K; j++) {
      varobj(iter) += pi(j) * log(sa2_vec(j)) * p / 2.0;
    }
    // Restore pi if we are not updating it
    if (!updatepi)
      pi = piold;
    // Convergence: beta change small, or objective non-decreasing
    if (iter >= miniter - 1) {
      double beta_norm = norm(beta, 2);
      if (norm(betaold - beta, 2) < convtol * std::max(1.0, beta_norm)) {
        iter++; // count the completed iteration before leaving the loop
        break;
      }
      // An increase in the objective signals the ascent has stalled.
      if (iter > 0 && varobj(iter) > varobj(iter - 1))
        break;
    }
  }
  if (verbose) {
    Rprintf("Mr.ASH terminated at iteration %d: max|beta|=%.4e, sigma2=%.4e, pi0=%.4f\n",
            iter, max(abs(beta)), sigma2, pi(0));
  }
  using namespace cpp11::literals;
  // varobj is trimmed to the iterations actually performed.
  return writable::list({
    "beta"_nm = as_doubles(beta),
    "sigma2"_nm = as_sexp(sigma2),
    "pi"_nm = as_doubles(pi),
    "iter"_nm = as_sexp(iter),
    "varobj"_nm = as_doubles(vec(varobj.subvec(0, iter - 1)))
  });
}


================================================
FILE: src/cpp11.cpp
================================================
// Generated by cpp11: do not edit by hand
// clang-format off

#include "cpp11/declarations.hpp"
#include
// caisa.cpp
integers random_order(int p, int numiter);
extern "C" SEXP _susieR_random_order(SEXP p, SEXP numiter) {
  BEGIN_CPP11
    return cpp11::as_sexp(random_order(cpp11::as_cpp>(p), cpp11::as_cpp>(numiter)));
  END_CPP11
}
// caisa.cpp
writable::list caisa_cpp(const doubles_matrix<>& X, const doubles& w, const doubles& sa2, const doubles& pi_init, const doubles& beta_init, const doubles& r_init, double sigma2, const integers& o_r, int maxiter, int miniter, double convtol, double epstol, std::string method_q, bool updatepi, bool updatesigma, bool verbose);
extern "C" SEXP _susieR_caisa_cpp(SEXP X, SEXP w, SEXP sa2, SEXP pi_init, SEXP beta_init, SEXP r_init, SEXP sigma2, SEXP o_r, SEXP maxiter, SEXP miniter, SEXP convtol, SEXP epstol, SEXP method_q, SEXP updatepi, SEXP updatesigma, SEXP verbose) {
  BEGIN_CPP11
    return cpp11::as_sexp(caisa_cpp(cpp11::as_cpp&>>(X), cpp11::as_cpp>(w), cpp11::as_cpp>(sa2), cpp11::as_cpp>(pi_init), cpp11::as_cpp>(beta_init), cpp11::as_cpp>(r_init), cpp11::as_cpp>(sigma2), cpp11::as_cpp>(o_r), cpp11::as_cpp>(maxiter), cpp11::as_cpp>(miniter), cpp11::as_cpp>(convtol), cpp11::as_cpp>(epstol), cpp11::as_cpp>(method_q), cpp11::as_cpp>(updatepi), cpp11::as_cpp>(updatesigma), cpp11::as_cpp>(verbose)));
  END_CPP11
}
// mr_ash_rss.cpp
writable::list mr_ash_rss_cpp(const doubles& bhat, const doubles& shat, const doubles& z, const doubles_matrix<>& R, double var_y, int n, double sigma2_e, const doubles& s0, const doubles& w0, const doubles& mu1_init, double tol, int max_iter, bool update_w0, bool update_sigma, bool compute_ELBO, bool standardize);
extern "C" SEXP _susieR_mr_ash_rss_cpp(SEXP bhat, SEXP shat, SEXP z, SEXP R, SEXP var_y, SEXP n, SEXP sigma2_e, SEXP s0, SEXP w0, SEXP mu1_init, SEXP tol, SEXP max_iter, SEXP update_w0, SEXP update_sigma, SEXP compute_ELBO, SEXP standardize) {
  BEGIN_CPP11
    return cpp11::as_sexp(mr_ash_rss_cpp(cpp11::as_cpp>(bhat), cpp11::as_cpp>(shat), cpp11::as_cpp>(z), cpp11::as_cpp&>>(R), cpp11::as_cpp>(var_y), cpp11::as_cpp>(n), cpp11::as_cpp>(sigma2_e), cpp11::as_cpp>(s0), cpp11::as_cpp>(w0), cpp11::as_cpp>(mu1_init), cpp11::as_cpp>(tol), cpp11::as_cpp>(max_iter), cpp11::as_cpp>(update_w0), cpp11::as_cpp>(update_sigma), cpp11::as_cpp>(compute_ELBO), cpp11::as_cpp>(standardize)));
  END_CPP11
}

extern "C" {
static const R_CallMethodDef CallEntries[] = {
    {"_susieR_caisa_cpp",      (DL_FUNC) &_susieR_caisa_cpp,      16},
    {"_susieR_mr_ash_rss_cpp", (DL_FUNC) &_susieR_mr_ash_rss_cpp, 16},
    {"_susieR_random_order",   (DL_FUNC) &_susieR_random_order,    2},
    {NULL, NULL, 0}
};
}

extern "C" attribute_visible void R_init_susieR(DllInfo* dll){
  R_registerRoutines(dll, NULL, CallEntries, NULL, NULL);
  R_useDynamicSymbols(dll, FALSE);
  R_forceSymbols(dll, TRUE);
}


================================================
FILE: src/mr_ash.h
================================================
#ifndef MR_ASH_H
#define MR_ASH_H

// NOTE(review): the two bare #include targets below were stripped by the
// extraction (angle-bracket headers) — restore from upstream before building.
#include
#include

// Helper: build a random permutation vector of length p * numiter.
// Wrapped by a registered entry point in caisa.cpp.
// Concatenates numiter independent random permutations of 0..p-1, one per
// coordinate-ascent iteration. Uses Armadillo's RNG (seeded from R via the
// cpp11 bridge).
inline arma::uvec random_order_impl(int p, int numiter) {
  arma::uvec o(p * numiter);
  for (int i = 0 ; i < numiter; i++) {
    o.subvec(i * p, (i+1) * p - 1) = arma::randperm(p);
  }
  return o;
}

// Outer "sum" matrix: A(i, j) = a(i) + b(j).
inline arma::mat outerAddition(const arma::vec& a, const arma::vec& b) {
  arma::mat A(a.n_elem, b.n_elem);
  A.fill(0);
  A.each_row() += b.t();
  A.each_col() += a;
  return A;
}

// Single-coordinate Mr.ASH update for coefficient j.
//   xj     : j-th column of X;  wj: its weight (used as x_j'x_j here);
//   betaj  : coefficient j, updated in place;
//   r      : residual vector, updated in place (effect j removed then re-added);
//   piold  : mixture weights from the previous sweep (read only);
//   pi     : accumulator for the new mixture weights (+= phij / p);
//   s2inv  : column j of the precomputed posterior-variance matrix;
//   a1, a2 : running M-step accumulators (quadratic term and entropy term).
inline void updatebetaj(const arma::vec& xj, double wj,
                        double& betaj, arma::vec& r, arma::vec& piold, arma::vec& pi,
                        double sigma2, const arma::vec& sa2, const arma::vec& s2inv,
                        double& a1, double& a2, int j, int p, double epstol) {
  // calculate b: partial residual correlation with x_j (effect j added back)
  double bjwj = dot(r, xj) + betaj * wj;
  // update r first step: remove effect j from the residual
  r += xj * betaj;
  // calculate muj: per-component posterior means (null component pinned to 0)
  arma::vec muj = bjwj * s2inv;
  muj(0) = 0;
  // calculate phij: per-component posterior assignment probabilities
  arma::vec phij = log(piold + epstol) - log(1 + sa2 * wj)/2 + muj * (bjwj / 2 / sigma2);
  phij = exp(phij - max(phij)); // stabilized softmax
  phij = phij / sum(phij);
  // pinew: accumulate this coordinate's contribution to the updated weights
  pi += phij / p;
  // update betaj: posterior mean over mixture components
  betaj = dot(phij, muj);
  // update r second step: put the refreshed effect j back into the residual
  r += -xj * betaj;
  // precalculate for M-step
  a1 += bjwj * betaj;
  a2 += dot(phij, log(phij + epstol));
  phij(0) = 0; // null component excluded from the variance-entropy term
  a2 += -dot(phij, log(s2inv)) / 2;
  return;
}

#endif


================================================
FILE: src/mr_ash_rss.cpp
================================================
// NOTE(review): the two bare #include targets below were stripped by the
// extraction (angle-bracket headers) — restore from upstream before building.
#include
#include
#include "mr_ash_rss.h"

using namespace cpp11;
using namespace arma;
using namespace std;

// Registered cpp11 entry point for mr_ash_rss() (mr_ash_rss.h): converts R
// inputs to Armadillo types, runs the solver, and maps the result back to a
// named R list.
// NOTE(review): several unordered_map uses in this translation unit lost
// their template arguments (likely unordered_map<string, mat>) in extraction.
[[cpp11::register]]
writable::list mr_ash_rss_cpp(const doubles& bhat, const doubles& shat,
                              const doubles& z, const doubles_matrix<>& R,
                              double var_y, int n, double sigma2_e,
                              const doubles& s0, const doubles& w0,
                              const doubles& mu1_init,
                              double tol = 1e-8, int max_iter = 1e5,
                              bool update_w0 = true, bool update_sigma = true,
                              bool compute_ELBO = true, bool standardize = false) {
  // Convert input types
  vec bhat_vec = as_Col(bhat);
  vec shat_vec = as_Col(shat);
  vec z_vec = as_Col(z);
  mat R_mat = as_Mat(R);
  vec s0_vec = as_Col(s0);
  vec w0_vec = as_Col(w0);
  vec mu1_init_vec = as_Col(mu1_init);
  // Call the C++ function
  unordered_map result = mr_ash_rss(bhat_vec, shat_vec, z_vec, R_mat, var_y, n,
                                    sigma2_e, s0_vec, w0_vec, mu1_init_vec,
                                    tol, max_iter, update_w0, update_sigma,
                                    compute_ELBO, standardize);
  // Convert the result to a named list (matrices returned as doubles_matrix).
  // The unordered_map iteration does not preserve insertion order.
  writable::list ret;
  for (const auto& item : result) {
    cpp11::named_arg na(item.first.c_str());
    na = as_doubles_matrix(item.second);
    ret.push_back(na);
  }
  return ret;
}


================================================
FILE: src/mr_ash_rss.h
================================================
#ifndef MR_ASH_RSS_H
#define MR_ASH_RSS_H

// NOTE(review): the six bare #include targets below were stripped by the
// extraction (angle-bracket headers) — restore from upstream before building.
#include
#include
#include
#include
#include
#include

using namespace arma;
using namespace std;

/**
 * Softmax function
 *
 * @param x Input vector
 * @return Softmax output vector
 */
inline vec softmax_rss(const vec& x) {
  // Subtracting max(x) before exponentiating avoids overflow.
  vec y = exp(x - max(x));
  return y / sum(y);
}

/**
 * Bayesian regression with Normal prior from sufficient statistics
 *
 * @param xTx X'X (scalar)
 * @param xTy X'y (scalar)
 * @param sigma2_e Error variance
 * @param sigma2_0 Prior variance
 * @return An unordered_map containing the least-squares estimate (bhat, s2),
 *   the posterior mean and standard deviation (mu1, sigma2_1), and the
 *   log-Bayes factor (logbf)
 */
inline unordered_map bayes_ridge_sufficient(double xTx, double xTy,
                                            double sigma2_e, double sigma2_0) {
  // Compute the least-squares estimate and its variance
  double bhat = xTy / xTx;
  double s2 = sigma2_e / xTx;
  // Compute the posterior mean and variance assuming a normal prior with
  // zero mean and variance sigma2_0
  double sigma2_1 = 1 / (1 / s2 + 1 / sigma2_0);
  double mu1 = sigma2_1 / s2 * bhat;
  // Compute the log-Bayes factor
  double logbf = log(s2 / (sigma2_0 + s2)) / 2 +
                 (pow(bhat, 2) / s2 - pow(bhat, 2) / (sigma2_0 + s2)) / 2;
  // Return the least-squares estimate (bhat, s2), the posterior mean and
  // standard deviation (mu1, sigma2_1), and the log-Bayes factor (logbf)
  return {{"bhat",
bhat}, {"s2", s2}, {"mu1", mu1}, {"sigma2_1", sigma2_1}, {"logbf", logbf}}; } /** * Bayesian regression with mixture-of-normals prior from sufficient statistics * * @param xTx X'X (scalar) * @param xTy X'y (scalar) * @param sigma2_e Error variance * @param w0 Mixture weights * @param sigma2_0 Mixture variances * @return An unordered_map containing the log-Bayes factor (logbf), the posterior assignment probabilities (w1), the posterior mean (mu1) and variance (sigma2_1) of the coefficients, and the posterior mean (mu1_k) and variance (sigma2_1_k) for each mixture component */ inline unordered_map bayes_mix_sufficient(double xTx, double xTy, double sigma2_e, const vec& w0, const vec& sigma2_0) { // Get the number of mixture components (K) int K = sigma2_0.n_elem; // Compute the Bayes factors and posterior statistics separately for each mixture component // Note: sigma2_0[i] is the prior variance scale parameter (like sa2 in mr.ash). // The actual prior variance is sigma2_e * sigma2_0[i], matching mr.ash's model: // beta_j ~ sum_k pi_k * N(0, sigma2 * sa2[k]) mat out(K, 5); for (int i = 0; i < K; i++) { unordered_map ridge_out = bayes_ridge_sufficient(xTx, xTy, sigma2_e, sigma2_e * sigma2_0[i]); out(i, 0) = ridge_out["bhat"]; out(i, 1) = ridge_out["s2"]; out(i, 2) = ridge_out["mu1"]; out(i, 3) = ridge_out["sigma2_1"]; out(i, 4) = ridge_out["logbf"]; } // Compute the posterior assignment probabilities for the latent indicator variable vec w1 = softmax_rss(out.col(4) + log(w0)); // Compute the posterior mean (mu1) and variance (sigma2_1) of the regression coefficients vec mu1_k_vec = out.col(2); vec sigma2_1_k_vec = out.col(3); double mu1 = sum(w1 % mu1_k_vec); double sigma2_1 = sum(w1 % (square(mu1_k_vec) + sigma2_1_k_vec)) - pow(mu1, 2); // Compute the log-Bayes factor as a linear combination of the individual BFs for each mixture component double u = max(out.col(4)); double logbf = u + log(sum(w0 % exp(out.col(4) - u))); // Return the posterior assignment 
probabilities (w1), the posterior mean (mu1) and variance (sigma2_1) of the coefficients, // and the posterior mean (mu1_k) and variance (sigma2_1_k) for each mixture component, and the log-Bayes factor (logbf) return {{"w1", w1}, {"mu1", vec(1, fill::value(mu1))}, {"sigma2_1", vec(1, fill::value(sigma2_1))}, {"mu1_k", mu1_k_vec}, {"sigma2_1_k", sigma2_1_k_vec}, {"logbf", vec(1, fill::value(logbf))}}; } /** * Bayesian multiple regression with mixture-of-normals prior from sufficient statistics * * @param XTy X'y vector * @param XTX X'X matrix * @param yTy y'y scalar * @param n Sample size * @param sigma2_e Error variance * @param sigma2_0 Mixture variances * @param w0 Mixture weights * @param mu1_init Initial value for mu1 * @param tol Convergence tolerance * @param max_iter Maximum number of iterations * @param update_w0 Whether to update w0 * @param update_sigma Whether to update sigma2_e * @param compute_ELBO Whether to compute the Evidence Lower Bound (ELBO) * @return An unordered_map containing the posterior assignment probabilities (w1), the posterior mean (mu1) and variance (sigma2_1) of the coefficients, the error variance (sigma2_e), the mixture weights (w0), and optionally the ELBO */ inline unordered_map mr_ash_sufficient(const vec& XTy, const mat& XTX, double yTy, int n, double& sigma2_e, const vec& sigma2_0, vec& w0, const vec& mu1_init, double tol = 1e-8, int max_iter = 1e5, bool update_w0 = true, bool update_sigma = true, bool compute_ELBO = true) { // Initialize parameters int p = XTX.n_cols; int K = sigma2_0.n_elem; vec mu1_t = mu1_init; vec sigma2_1_t(p, fill::zeros); mat w1_t(p, K, fill::zeros); mat mu1_k_t(p, K, fill::zeros); mat sigma2_1_k_t(p, K, fill::zeros); int t = 0; double ELBO = 0; vec varobj_vec(max_iter, fill::zeros); bool converged = false; // Iterate until convergence while (!converged) { double var_part_ERSS = 0; double neg_KL = 0; // Update iterator t++; // Exit loop if maximum number of iterations is reached if (t > max_iter) { t 
        = max_iter; // Clamp to valid index range
      cerr << "Max number of iterations reached. Try increasing max_iter." << endl;
      break;
    }
    // Save current estimates
    vec mu1_tminus1 = mu1_t;
    // Expected residual correlations with the current fit.
    vec XTrbar = XTy - XTX * mu1_t;
    // Loop through the variables
    for (int j = 0; j < p; j++) {
      // Remove j-th effect from expected residuals
      vec XTrbar_j = XTrbar + XTX.col(j) * mu1_t[j];
      double xTrbar_j = XTrbar_j[j];
      double xTx = XTX(j, j);
      // Run Bayesian SLR
      unordered_map bfit = bayes_mix_sufficient(xTx, xTrbar_j, sigma2_e, w0, sigma2_0);
      // Update variational parameters
      mu1_t[j] = bfit["mu1"][0];
      sigma2_1_t[j] = bfit["sigma2_1"][0];
      w1_t.row(j) = bfit["w1"].t();
      mu1_k_t.row(j) = bfit["mu1_k"].t();
      sigma2_1_k_t.row(j) = bfit["sigma2_1_k"].t();
      // Compute ELBO parameters
      if (compute_ELBO) {
        var_part_ERSS += sigma2_1_t[j] * xTx;
        neg_KL += bfit["logbf"][0] +
                  (1 / (2 * sigma2_e)) *
                  (-2 * xTrbar_j * mu1_t[j] + (xTx * (sigma2_1_t[j] + pow(mu1_t[j], 2))));
      }
      // Update expected residuals
      XTrbar = XTrbar_j - XTX.col(j) * mu1_t[j];
    }
    // Update w0 if requested
    if (update_w0) {
      w0 = sum(w1_t, 0).t() / p;
    }
    // Compute convergence using relative L2 norm (matching mr.ash)
    double beta_diff = norm(mu1_t - mu1_tminus1, 2);
    double beta_norm = norm(mu1_t, 2);
    // Compute ERSS and ELBO
    double ERSS = yTy - 2 * dot(XTy, mu1_t) + as_scalar(mu1_t.t() * XTX * mu1_t) + var_part_ERSS;
    if (compute_ELBO) {
      ELBO = -0.5 * log(n) - 0.5 * n * log(2 * datum::pi * sigma2_e) -
             (1 / (2 * sigma2_e)) * ERSS + neg_KL;
    }
    varobj_vec[t - 1] = ELBO;
    // Update residual variance using mr.ash's sigma_dep_q formula:
    // sigma2 = (y'y - beta'X'y) / n
    if (update_sigma) {
      sigma2_e = (yTy - dot(XTy, mu1_t)) / n;
    }
    // Check convergence (matching mr.ash's relative L2 criterion)
    if (t >= 2 && beta_diff < tol * max(1.0, beta_norm)) {
      converged = true;
    }
  }
  // Return results including iteration count and ELBO trajectory
  return {{"mu1", mat(mu1_t)},
          {"sigma2_1", mat(sigma2_1_t)},
          {"w1", w1_t},
          {"sigma2_e", mat(1, 1, fill::value(sigma2_e))},
          {"w0", mat(w0)},
          {"ELBO", mat(1, 1, fill::value(ELBO))},
          {"iter", mat(1, 1, fill::value((double)t))},
          {"varobj", mat(varobj_vec.subvec(0, t - 1))}};
}

/**
 * Rescale posterior mean and covariance
 *
 * @param mu1 Posterior mean vector
 * @param sigma2_1 Posterior covariance matrix
 * @param sx Scaling vector
 * @return An unordered_map containing the rescaled posterior mean (mu1_orig)
 *   and covariance (sigma2_1_orig)
 */
inline unordered_map rescale_post_mean_covar(const vec& mu1, const mat& sigma2_1,
                                             const vec& sx) {
  // Undo column standardization: divide means (and scale covariance) by sx.
  vec mu1_orig = mu1 / sx;
  mat sigma2_1_orig = diagmat(1 / sx) * sigma2_1 * diagmat(1 / sx);
  return {{"mu1_orig", mat(mu1_orig)}, {"sigma2_1_orig", sigma2_1_orig}};
}

/**
 * Bayesian multiple regression with mixture-of-normals prior
 *
 * @param bhat Observed effect sizes (standardized)
 * @param shat Standard errors of effect sizes
 * @param z Z-scores
 * @param R Correlation matrix
 * @param var_y Variance of the outcome
 * @param n Sample size
 * @param sigma2_e Error variance
 * @param s0 Prior variances for the mixture components
 * @param w0 Prior weights for the mixture components
 * @param mu1_init Initial value for the posterior mean of the coefficients
 * @param tol Convergence tolerance
 * @param max_iter Maximum number of iterations
 * @param update_w0 Whether to update the mixture weights
 * @param update_sigma Whether to update the error variance
 * @param compute_ELBO Whether to compute the Evidence Lower Bound (ELBO)
 * @param standardize Whether to standardize the input data
 * @return An unordered_map containing the posterior mean (mu1) and covariance
 *   (sigma2_1) of the coefficients, the posterior assignment probabilities
 *   (w1), the error variance (sigma2_e), the mixture weights (w0), and
 *   optionally the ELBO
 */
inline unordered_map mr_ash_rss(const vec& bhat, const vec& shat, const vec& z,
                                const mat& R, double var_y, int n, double sigma2_e,
                                const vec& s0, vec& w0, const vec& mu1_init,
                                double tol = 1e-8, int max_iter = 1e5,
                                bool update_w0 = true, bool update_sigma = true,
bool compute_ELBO = true, bool standardize = false) { // Get number of variables int p = z.n_elem; // Initialize regression coefficients to 0 if not provided vec mu1_init_use = mu1_init; if (mu1_init.is_empty()) { mu1_init_use = vec(p, fill::zeros); } // Compute Z-scores if not provided vec z_use = z; if (z.is_empty()) { z_use = bhat / shat; } // Compute PVE-adjusted Z-scores if sample size is provided vec adj(p, fill::ones); if (std::isfinite(n)) { adj = (n - 1) / (square(z_use) + n - 2); z_use %= sqrt(adj); } // Compute X'X and X'y mat XtX; vec Xty; if (std::isfinite(var_y) && !shat.is_empty()) { vec XtXdiag = var_y * adj / square(shat); XtX = diagmat(sqrt(XtXdiag)) * R * diagmat(sqrt(XtXdiag)); XtX = 0.5 * (XtX + XtX.t()); Xty = z_use % sqrt(adj) % (var_y / shat); } else { // The effects are on the standardized X, y scale XtX = (n - 1) * R; Xty = z_use * sqrt(n - 1); var_y = 1.0; } // Adjust X'X and X'y if X is standardized vec sx(p, fill::ones); if (standardize) { vec dXtX = XtX.diag(); sx = sqrt(dXtX / (n - 1)); sx.replace(0, 1); XtX = diagmat(1 / sx) * XtX * diagmat(1 / sx); Xty /= sx; mu1_init_use %= sx; } // Run variational inference unordered_map result = mr_ash_sufficient(Xty, XtX, var_y * (n - 1), n, sigma2_e, s0, w0, mu1_init_use, tol, max_iter, update_w0, update_sigma, compute_ELBO); // Rescale posterior mean and covariance if X was standardized if (standardize) { unordered_map out_adj = rescale_post_mean_covar(vectorise(result["mu1"]), result["sigma2_1"], sx); result["mu1"] = out_adj["mu1_orig"]; result["sigma2_1"] = out_adj["sigma2_1_orig"]; } return {{"mu1", result["mu1"]}, {"sigma2_1", result["sigma2_1"]}, {"w1", result["w1"]}, {"sigma2_e", result["sigma2_e"]}, {"w0", result["w0"]}, {"ELBO", result["ELBO"]}, {"iter", result["iter"]}, {"varobj", result["varobj"]}}; }; #endif ================================================ FILE: tests/README.md ================================================ # susieR Testing Framework This directory contains the 
comprehensive test suite for the susieR 2.0 package, with **>1,000 total tests** ensuring code correctness, stability, and consistency with the reference implementation. ## File Organization - `testthat/`: Directory containing test files - `helper_*.R`: Helper functions used in testing for simulating data, assigning attributes, and more - `test_*.R`: Unit tests validating correctness and stability for all functions in susieR 2.0 - `reference/`: Reference tests ensuring consistency with original susieR 1.0 implementation ================================================ FILE: tests/testthat/helper_nig_reference.R ================================================ # ============================================================================= # HELPER FUNCTIONS FOR NIG REFERENCE COMPARISON # ============================================================================= # # These functions compare the local susieR implementation of # estimate_residual_method = "NIG" against the reference # implementation on stephenslab/susieR@fix-susie-small-sigma-update # (commit a999d44), where the equivalent feature is small = TRUE. # # This helper parallels helper_reference.R but targets a different # reference commit and maps between the two parameter interfaces. 
#

library(pkgload)
library(rprojroot)

# Reference package details for the NIG comparison
.nig_ref_repo <- "stephenslab/susieR"
.nig_ref_commit <- "a999d44"

# Cached environments (separate from helper_reference.R's globals)
.nig_ref_env <- NULL
.nig_dev_env <- NULL
.nig_ref_source_path <- NULL

# Get reference source for the fix-susie-small-sigma-update branch.
# Clones the repo into tempdir() once and pins it at .nig_ref_commit;
# subsequent calls reuse the cached checkout.
get_nig_reference_source <- function() {
  if (!is.null(.nig_ref_source_path) && dir.exists(.nig_ref_source_path)) {
    return(.nig_ref_source_path)
  }
  ref_source <- file.path(tempdir(), "susieR_nig_reference_source")
  if (!dir.exists(ref_source)) {
    message("Downloading NIG reference source from GitHub...")
    result <- system(sprintf("git clone -q https://github.com/%s.git %s 2>&1",
                             .nig_ref_repo, ref_source), intern = FALSE)
    if (result != 0) {
      # Remove any partial clone so a later call retries from scratch.
      unlink(ref_source, recursive = TRUE)
      stop("Failed to clone reference package")
    }
    result <- system(sprintf("cd %s && git checkout -q %s 2>&1",
                             ref_source, .nig_ref_commit), intern = FALSE)
    if (result != 0) {
      # BUGFIX: previously the cloned directory was left behind on checkout
      # failure, so the next call would see dir.exists(ref_source) and
      # silently reuse a checkout at the WRONG commit. Delete it so the
      # download is retried cleanly.
      unlink(ref_source, recursive = TRUE)
      stop("Failed to checkout commit ", .nig_ref_commit)
    }
    message("\u2713 NIG reference source downloaded")
  }
  .nig_ref_source_path <<- ref_source
  return(ref_source)
}

# Load the fix-susie-small-sigma-update reference using pkgload.
# The loaded result is cached in .nig_ref_env.
load_nig_reference_env <- function() {
  if (!is.null(.nig_ref_env)) {
    return(.nig_ref_env)
  }
  if (!requireNamespace("pkgload", quietly = TRUE)) {
    stop("Package 'pkgload' is required. Install with: install.packages('pkgload')")
  }
  ref_source <- get_nig_reference_source()
  message("Loading NIG reference package with pkgload...")
  env <- pkgload::load_all(ref_source, export_all = FALSE, quiet = TRUE)
  .nig_ref_env <<- env
  return(env)
}

# Load development package using pkgload. The package root is located with
# rprojroot; falls back to ../.. (assuming we run from tests/testthat).
load_nig_development_env <- function() {
  if (!is.null(.nig_dev_env)) {
    return(.nig_dev_env)
  }
  if (!requireNamespace("pkgload", quietly = TRUE)) {
    stop("Package 'pkgload' is required. Install with: install.packages('pkgload')")
  }
  dev_source <- tryCatch({
    rprojroot::find_root(rprojroot::is_r_package)
  }, error = function(e) {
    normalizePath(file.path(getwd(), "../.."))
  })
  message("Loading development package with pkgload...")
  env <- pkgload::load_all(dev_source, export_all = FALSE, quiet = TRUE)
  .nig_dev_env <<- env
  return(env)
}

# Skip test if reference not available (e.g. no network / no git).
skip_if_no_nig_reference <- function() {
  tryCatch({
    load_nig_reference_env()
    load_nig_development_env()
  }, error = function(e) {
    skip(paste("NIG reference comparison not available:", e$message))
  })
}

# -----------------------------------------------------------------------
# compare_NIG_to_reference
#
# Runs susie() with estimate_residual_method = "NIG" on the
# development package and susie() with small = TRUE on the reference
# branch, then compares all output fields.
#
# Parameters:
#   dev_args  - named list of arguments for the development susie() call
#               (must include X and y; estimate_residual_method is set
#               automatically to "NIG")
#   ref_args  - (optional) named list of arguments for the reference
#               susie() call. If NULL, derived from dev_args by mapping
#               estimate_residual_method -> small = TRUE and
#               tol -> tol_small.
#   tolerance - numeric tolerance for expect_equal comparisons
# -----------------------------------------------------------------------
compare_NIG_to_reference <- function(dev_args, ref_args = NULL,
                                     tolerance = 1e-5) {
  skip_if_no_nig_reference()
  ref_env <- load_nig_reference_env()
  dev_env <- load_nig_development_env()

  # Ensure the dev call uses NIG
  dev_args$estimate_residual_method <- "NIG"

  # Match reference behavior: disable V null threshold check and use
  # the same convergence tolerance as the reference (tol_small = 1e-4)
  if (is.null(dev_args$check_null_threshold)) dev_args$check_null_threshold <- -Inf
  if (is.null(dev_args$tol)) dev_args$tol <- 1e-4

  # Match reference NIG hyperparameter defaults. Dev defaults changed in
  # commit b0b0c40 ("new defaults") from alpha0 = beta0 = 0.1 to
  # alpha0 = beta0 = 1/sqrt(n), a weakly-informative scaling. The reference
  # (stephenslab/susieR@a999d44, small = TRUE) still uses 0.1. Force 0.1
  # on the dev side when the caller hasn't set these so the two runs use
  # the same prior; the change to 1/sqrt(n) is a deliberate design choice
  # unrelated to mathematical parity with the reference.
  if (is.null(dev_args$alpha0)) dev_args$alpha0 <- 0.1
  if (is.null(dev_args$beta0)) dev_args$beta0 <- 0.1

  # Build reference args by mapping interface differences
  if (is.null(ref_args)) {
    ref_args <- dev_args
    # Map estimate_residual_method -> small
    ref_args$estimate_residual_method <- NULL
    ref_args$small <- TRUE
    # Map tol -> tol_small (reference replaces tol with tol_small when small=TRUE)
    if (!is.null(ref_args$tol)) {
      ref_args$tol_small <- ref_args$tol
      ref_args$tol <- NULL
    }
    # Remove parameters that don't exist in the reference interface
    ref_args$convergence_method <- NULL
    # The reference uses s_init instead of model_init
    if (!is.null(ref_args$model_init)) {
      ref_args$s_init <- ref_args$model_init
      ref_args$model_init <- NULL
    }
  }

  ref_func <- ref_env$env[["susie"]]
  dev_func <- dev_env$env[["susie"]]
  if (is.null(ref_func)) stop("susie() not found in reference package")
  if (is.null(dev_func)) stop("susie() not found in development package")

  # Suppress known warnings (method override messages)
  dev_result <- suppressWarnings(do.call(dev_func, dev_args))
  ref_result <- suppressWarnings(do.call(ref_func, ref_args))

  # Return both results for custom assertions
  invisible(list(dev = dev_result, ref = ref_result))
}

# -----------------------------------------------------------------------
# expect_equal_NIG_objects
#
# Deep comparison of susie objects produced under the NIG /
# small = TRUE prior. Compares the standard fields (alpha, mu, mu2, V,
# sigma2, elbo, fitted, intercept, pip, sets) plus the NIG-specific
# rv field.
# -----------------------------------------------------------------------
expect_equal_NIG_objects <- function(dev_obj, ref_obj, tolerance = 1e-5) {

  # Local shorthands: numeric comparison honoring `tolerance`, and exact
  # comparison; both attach a descriptive failure message.
  check_num <- function(dev_val, ref_val, label)
    expect_equal(dev_val, ref_val, tolerance = tolerance, info = label)
  check_exact <- function(dev_val, ref_val, label)
    expect_equal(dev_val, ref_val, info = label)

  # Core posterior quantities.
  check_num(dev_obj$alpha, ref_obj$alpha,
            "alpha (posterior inclusion probabilities) differ")
  check_num(dev_obj$mu, ref_obj$mu, "mu (posterior means) differ")
  check_num(dev_obj$mu2, ref_obj$mu2, "mu2 (posterior second moments) differ")

  # Variance parameters.
  check_num(dev_obj$V, ref_obj$V, "V (prior variance, after rv scaling) differs")
  check_num(dev_obj$sigma2, ref_obj$sigma2, "sigma2 (residual variance) differs")

  # Per-effect residual variance is specific to the NIG prior; compare it
  # only when both objects carry it.
  if (!(is.null(dev_obj$rv) || is.null(ref_obj$rv)))
    check_num(dev_obj$rv, ref_obj$rv, "rv (per-effect residual variance) differs")

  # Convergence diagnostics. For L = 1 the dev package intentionally uses
  # ELBO convergence while the reference uses PIP convergence, so niter and
  # elbo may legitimately differ; compare them only when L > 1.
  if (nrow(dev_obj$alpha) > 1) {
    check_exact(dev_obj$niter, ref_obj$niter, "Number of iterations differs")
    check_exact(dev_obj$converged, ref_obj$converged,
                "Convergence status differs")
  }

  # The ELBO (loglik) is still well-defined for L = 1; compare the traces
  # whenever both are present, non-NA, and of matching length (the lengths
  # can differ when the convergence methods differ).
  elbo_comparable <- !is.null(dev_obj$elbo) && !is.null(ref_obj$elbo) &&
    !all(is.na(dev_obj$elbo)) && !all(is.na(ref_obj$elbo)) &&
    length(dev_obj$elbo) == length(ref_obj$elbo)
  if (elbo_comparable)
    check_num(dev_obj$elbo, ref_obj$elbo, "ELBO values differ")

  # Fitted values (when present) and intercept.
  if (!(is.null(dev_obj$fitted) || is.null(ref_obj$fitted)))
    check_num(dev_obj$fitted, ref_obj$fitted, "Fitted values differ")
  check_num(dev_obj$intercept, ref_obj$intercept, "Intercept differs")

  # Posterior inclusion probabilities.
  if (!(is.null(dev_obj$pip) || is.null(ref_obj$pip)))
    check_num(dev_obj$pip, ref_obj$pip, "PIPs differ")

  # Credible sets: membership compared exactly, purity and coverage
  # compared numerically.
  if (!(is.null(dev_obj$sets) || is.null(ref_obj$sets))) {
    check_exact(dev_obj$sets$cs, ref_obj$sets$cs, "Credible sets differ")
    if (!(is.null(dev_obj$sets$purity) || is.null(ref_obj$sets$purity)))
      check_num(dev_obj$sets$purity, ref_obj$sets$purity, "CS purity differs")
    check_num(dev_obj$sets$coverage, ref_obj$sets$coverage,
              "CS coverage differs")
  }

  invisible(TRUE)
}

# -----------------------------------------------------------------------
# run_ss_and_individual_NIG
#
# Given X, y, and extra arguments (L, standardize, intercept, alpha0,
# beta0, etc.), runs both susie() and susie_ss() with
# estimate_residual_method = "NIG", ensuring that the
# sufficient statistics are computed to match susie()'s internal
# preprocessing.
#
# Returns list(ind = ..., ss = ...) with both results.
# -----------------------------------------------------------------------
run_ss_and_individual_NIG <- function(X, y, extra_args = list()) {
  nobs <- nrow(X)
  nvar <- ncol(X)

  # Preprocessing switches; defaults mirror susie()'s own defaults.
  use_intercept <- TRUE
  if (!is.null(extra_args$intercept)) use_intercept <- extra_args$intercept
  use_standardize <- TRUE
  if (!is.null(extra_args$standardize)) use_standardize <- extra_args$standardize

  # Reproduce susie()'s internal preprocessing: optional centering of y and
  # the columns of X, then optional column standardization.
  ybar <- mean(y)
  xbar <- colMeans(X)
  if (use_intercept) {
    y_ctr <- y - ybar
    X_ctr <- scale(X, center = TRUE, scale = FALSE)
  } else {
    y_ctr <- y
    X_ctr <- X
  }
  if (use_standardize) {
    sds <- apply(X, 2, sd)
    sds[sds == 0] <- 1  # zero-variance columns are left unscaled
    X_std <- sweep(X_ctr, 2, sds, "/")
  } else {
    X_std <- X_ctr
  }

  # Sufficient statistics computed from the preprocessed data.
  XtX <- crossprod(X_std)
  Xty <- drop(t(X_std) %*% y_ctr)
  yty <- sum(y_ctr^2)

  # Individual-level fit.
  ind_args <- c(list(X = X, y = y, estimate_residual_method = "NIG"), extra_args)
  res_ind <- suppressWarnings(do.call(susie, ind_args))

  # Sufficient-statistics fit: drop individual-only preprocessing switches,
  # pass the precomputed statistics, and hand over the centering constants
  # only when an intercept was fitted.
  ss_extra <- extra_args
  ss_extra$intercept <- NULL
  ss_extra$standardize <- NULL
  ss_args <- c(list(XtX = XtX, Xty = Xty, yty = yty, n = nobs,
                    estimate_residual_method = "NIG",
                    standardize = FALSE,
                    X_colmeans = if (use_intercept) xbar else NA,
                    y_mean = if (use_intercept) ybar else NA),
               ss_extra)
  res_ss <- suppressWarnings(do.call(susie_ss, ss_args))

  list(ind = res_ind, ss = res_ss)
}

# -----------------------------------------------------------------------
# run_rss_and_individual_NIG
#
# Given X, y, and extra arguments (L, standardize, intercept, alpha0,
# beta0, etc.), runs both susie() and susie_rss() with
# estimate_residual_method = "NIG", ensuring that the
# summary statistics (bhat, shat, R, var_y) are computed to match
# susie()'s internal preprocessing.
#
# Uses the bhat/shat/var_y input path of susie_rss(), which recovers
# exact sufficient statistics (XtX, Xty, yty) from summary statistics.
# This is necessary because the NIG prior's alpha0/beta0 break scale
# invariance, so the z-score-only path would not match.
#
# Returns list(ind = ..., rss = ...) with both results.
# -----------------------------------------------------------------------
run_rss_and_individual_NIG <- function(X, y, extra_args = list()) {
  n <- nrow(X)
  # NOTE(review): p is currently unused in this function.
  p <- ncol(X)

  # Extract preprocessing settings (defaults match susie)
  intercept <- if (!is.null(extra_args$intercept)) extra_args$intercept else TRUE
  standardize <- if (!is.null(extra_args$standardize)) extra_args$standardize else TRUE

  # Preprocess exactly as susie() does internally
  if (intercept) {
    y_c <- y - mean(y)
    X_c <- scale(X, center = TRUE, scale = FALSE)
  } else {
    y_c <- y
    X_c <- X
  }
  if (standardize) {
    csd <- apply(X, 2, sd)
    # Columns with zero variance are left unscaled.
    csd[csd == 0] <- 1
    X_cs <- t(t(X_c) / csd)
  } else {
    X_cs <- X_c
  }

  # Compute correlation matrix from preprocessed data
  R <- cor(X_cs)
  R <- (R + t(R)) / 2  # ensure symmetry

  # Compute bhat/shat via univariate regression on preprocessed data
  # center=FALSE because we already centered
  ss <- univariate_regression(X_cs, y_c, center = FALSE)

  # Compute var_y (sample variance of the centered response)
  var_y <- sum(y_c^2) / (n - 1)

  # Run individual-level susie
  ind_args <- c(list(X = X, y = y, estimate_residual_method = "NIG"), extra_args)
  res_ind <- suppressWarnings(do.call(susie, ind_args))

  # Build RSS arguments: remove individual-only params, add RSS-specific ones
  rss_extra <- extra_args
  rss_extra$intercept <- NULL
  rss_extra$standardize <- NULL
  rss_args <- c(list(bhat = ss$betahat, shat = ss$sebetahat, R = R, n = n,
                     var_y = var_y, estimate_residual_method = "NIG",
                     standardize = FALSE),
                rss_extra)
  res_rss <- suppressWarnings(do.call(susie_rss, rss_args))

  list(ind = res_ind, rss = res_rss)
}

# -----------------------------------------------------------------------
# expect_rss_matches_individual_ss
#
# Deep comparison of susie objects produced by the individual-level and
# RSS interfaces under NIG. Delegates to
# expect_ss_matches_individual_ss by mapping rss -> ss.
# -----------------------------------------------------------------------
expect_rss_matches_individual_ss <- function(res, tolerance = 1e-6) {
  expect_ss_matches_individual_ss(
    list(ind = res$ind, ss = res$rss),
    tolerance = tolerance
  )
}

# -----------------------------------------------------------------------
# expect_ss_matches_individual_ss
#
# Deep comparison of susie objects produced by the individual-level and
# sufficient-statistics interfaces under NIG.
# -----------------------------------------------------------------------
expect_ss_matches_individual_ss <- function(res, tolerance = 1e-6) {
  ind <- res$ind
  ss <- res$ss

  # Core posterior quantities
  expect_equal(ind$alpha, ss$alpha, tolerance = tolerance,
               info = "alpha differs between susie and susie_ss")
  expect_equal(ind$mu, ss$mu, tolerance = tolerance,
               info = "mu differs between susie and susie_ss")
  expect_equal(ind$mu2, ss$mu2, tolerance = tolerance,
               info = "mu2 differs between susie and susie_ss")
  expect_equal(ind$V, ss$V, tolerance = tolerance,
               info = "V differs between susie and susie_ss")
  expect_equal(ind$sigma2, ss$sigma2, tolerance = tolerance,
               info = "sigma2 differs between susie and susie_ss")
  expect_equal(ind$pip, ss$pip, tolerance = tolerance,
               info = "pip differs between susie and susie_ss")

  # Convergence (compared exactly, no tolerance)
  expect_equal(ind$niter, ss$niter,
               info = "niter differs between susie and susie_ss")
  expect_equal(ind$converged, ss$converged,
               info = "converged differs between susie and susie_ss")

  # NIG-specific: per-effect residual variance
  if (!is.null(ind$rv) && !is.null(ss$rv)) {
    expect_equal(ind$rv, ss$rv, tolerance = tolerance,
                 info = "rv differs between susie and susie_ss")
  }

  # Credible sets
  if (!is.null(ind$sets) && !is.null(ss$sets)) {
    expect_equal(ind$sets$cs, ss$sets$cs,
                 info = "Credible sets differ between susie and susie_ss")
    if (!is.null(ind$sets$purity) && !is.null(ss$sets$purity)) {
      expect_equal(ind$sets$purity,
ss$sets$purity,
                   tolerance = tolerance,
                   info = "CS purity differs between susie and susie_ss")
    }
  }

  invisible(TRUE)
}



================================================
FILE: tests/testthat/helper_reference.R
================================================
# =============================================================================
# HELPER FUNCTIONS FOR REFERENCE PACKAGE COMPARISON (PKGLOAD APPROACH)
# =============================================================================
#
# These functions compare the new susieR implementation against the reference
# package (stephenslab/susieR@1f9166c) to ensure results are identical.
#
# Strategy: Use pkgload to load both packages into separate environments

library(pkgload)
library(rprojroot)

# Reference package details
.ref_repo <- "stephenslab/susieR"
.ref_commit <- "1f9166c"

# Cached environments
.ref_env <- NULL
.dev_env <- NULL
.ref_source_path <- NULL

# Get reference package source (download once, cache path).
# Clones the repo into tempdir() and pins it at .ref_commit; later calls
# reuse the cached checkout.
get_reference_source <- function() {
  if (!is.null(.ref_source_path) && dir.exists(.ref_source_path)) {
    return(.ref_source_path)
  }

  # Download to temp directory
  ref_source <- file.path(tempdir(), "susieR_reference_source")
  if (!dir.exists(ref_source)) {
    message("Downloading reference package source from GitHub...")
    result <- system(sprintf("git clone -q https://github.com/%s.git %s 2>&1",
                             .ref_repo, ref_source), intern = FALSE)
    if (result != 0) {
      # Remove any partial clone so a later call retries from scratch.
      unlink(ref_source, recursive = TRUE)
      stop("Failed to clone reference package")
    }
    result <- system(sprintf("cd %s && git checkout -q %s 2>&1",
                             ref_source, .ref_commit), intern = FALSE)
    if (result != 0) {
      # BUGFIX: previously the cloned directory was left behind on checkout
      # failure, so the next call would see dir.exists(ref_source) and
      # silently reuse a checkout at the WRONG commit. Delete it so the
      # download is retried cleanly.
      unlink(ref_source, recursive = TRUE)
      stop("Failed to checkout commit ", .ref_commit)
    }
    message("✓ Reference source downloaded")
  }

  .ref_source_path <<- ref_source
  return(ref_source)
}

# Load reference package using pkgload; result cached in .ref_env.
load_reference_env <- function() {
  if (!is.null(.ref_env)) {
    return(.ref_env)
  }
  if (!requireNamespace("pkgload", quietly = TRUE)) {
    stop("Package 'pkgload' is required. Install with: install.packages('pkgload')")
  }
  ref_source <- get_reference_source()
  message("Loading reference package with pkgload...")
  env <- pkgload::load_all(ref_source, export_all = FALSE, quiet = TRUE)
  .ref_env <<- env
  return(env)
}

# Load development package using pkgload
load_development_env <- function() {
  if (!is.null(.dev_env)) {
    return(.dev_env)
  }
  if (!requireNamespace("pkgload", quietly = TRUE)) {
    stop("Package 'pkgload' is required. Install with: install.packages('pkgload')")
  }
  # Get path to development package (current package being tested)
  # Use rprojroot to find package root
  dev_source <- tryCatch({
    rprojroot::find_root(rprojroot::is_r_package)
  }, error = function(e) {
    # Fallback: assume we're in tests/testthat
    normalizePath(file.path(getwd(), "../.."))
  })
  message("Loading development package with pkgload...")
  env <- pkgload::load_all(dev_source, export_all = FALSE, quiet = TRUE)
  .dev_env <<- env
  return(env)
}

# Skip test if reference not available (e.g. no network / no git)
skip_if_no_reference <- function() {
  tryCatch({
    load_reference_env()
    load_development_env()
  }, error = function(e) {
    skip(paste("Reference comparison not available:", e$message))
  })
}

# Compare new implementation to reference
compare_to_reference <- function(func_name, args, tolerance = 1e-8,
                                 ref_func_name = NULL, ref_args = NULL) {
  skip_if_no_reference()

  # Load both environments
  ref_env <- load_reference_env()
  dev_env <- load_development_env()

  # If ref_func_name not specified, use same name as dev function
  if (is.null(ref_func_name)) {
    ref_func_name <- func_name
  }

  # If ref_args not specified, use same args as dev function
  if (is.null(ref_args)) {
    ref_args <- args
  }

  # Dev skips the null-likelihood V-zeroing step for EM (intentional: avoids
  # an inconsistent (q, V) pair that can decrease the ELBO; null effects are
  # instead removed by trim_null_effects() post-convergence). The reference
  # always runs the check. Setting check_null_threshold = -Inf disables the
  # check on the reference side without affecting dev, making the two paths
  # comparable. Only injected when the caller hasn't set it explicitly.
  uses_em <- identical(args$estimate_prior_method, "EM") ||
    identical(ref_args$estimate_prior_method, "EM")
  if (uses_em) {
    if (is.null(args$check_null_threshold)) args$check_null_threshold <- -Inf
    if (is.null(ref_args$check_null_threshold)) ref_args$check_null_threshold <- -Inf
  }

  # Get functions from each environment
  ref_func <- ref_env$env[[ref_func_name]]
  dev_func <- dev_env$env[[func_name]]

  if (is.null(ref_func)) {
    stop("Function '", ref_func_name, "' not found in reference package")
  }
  if (is.null(dev_func)) {
    stop("Function '", func_name, "' not found in development package")
  }

  # Call both implementations (potentially with different arguments)
  dev_result <- do.call(dev_func, args)
  ref_result <- do.call(ref_func, ref_args)

  # Deep comparison of all fields
  expect_equal_susie_objects(dev_result, ref_result, tolerance)

  invisible(list(dev = dev_result, ref = ref_result))
}

# Inject check_null_threshold = -Inf when estimate_prior_method = "EM" and
# the caller hasn't explicitly set a threshold. Needed because dev skips the
# null-likelihood V-zeroing step for EM while the reference always runs it;
# -Inf disables the check on the reference side. Safe for dev (the branch is
# not executed). Used by direct do.call sites in tests that don't go through
# compare_to_reference().
#' @keywords internal
inject_em_null_check <- function(args) {
  if (identical(args$estimate_prior_method, "EM") &&
      is.null(args$check_null_threshold)) {
    args$check_null_threshold <- -Inf
  }
  args
}

# Deep comparison of susie objects: checks posteriors, variance parameters,
# ELBO/convergence, fitted values, PIPs and credible sets, each with a
# descriptive failure message.
expect_equal_susie_objects <- function(dev_obj, ref_obj, tolerance = 1e-8) {

  # Core posterior quantities
  expect_equal(dev_obj$alpha, ref_obj$alpha, tolerance = tolerance,
               info = "alpha (posterior inclusion probabilities) differ")
  expect_equal(dev_obj$mu, ref_obj$mu, tolerance = tolerance,
               info = "mu (posterior means) differ")
  expect_equal(dev_obj$mu2, ref_obj$mu2, tolerance = tolerance,
               info = "mu2 (posterior second moments) differ")

  # Variance parameters
  expect_equal(dev_obj$V, ref_obj$V, tolerance = tolerance,
               info = "V (prior variance) differs")
  expect_equal(dev_obj$sigma2, ref_obj$sigma2, tolerance = tolerance,
               info = "sigma2 (residual variance) differs")

  # ELBO and convergence
  expect_equal(dev_obj$elbo, ref_obj$elbo, tolerance = tolerance,
               info = "ELBO values differ")
  expect_equal(dev_obj$niter, ref_obj$niter,
               info = "Number of iterations differs")
  expect_equal(dev_obj$converged, ref_obj$converged,
               info = "Convergence status differs")

  # Fitted values and intercept
  if (!is.null(dev_obj$fitted) && !is.null(ref_obj$fitted)) {
    expect_equal(dev_obj$fitted, ref_obj$fitted, tolerance = tolerance,
                 info = "Fitted values differ")
  }
  expect_equal(dev_obj$intercept, ref_obj$intercept, tolerance = tolerance,
               info = "Intercept differs")

  # PIPs (if present)
  if (!is.null(dev_obj$pip) && !is.null(ref_obj$pip)) {
    expect_equal(dev_obj$pip, ref_obj$pip, tolerance = tolerance,
                 info = "PIPs differ")
  }

  # Credible sets (if present)
  if (!is.null(dev_obj$sets) && !is.null(ref_obj$sets)) {
    expect_equal(dev_obj$sets$cs, ref_obj$sets$cs,
                 info = "Credible sets differ")
    if (!is.null(dev_obj$sets$purity) && !is.null(ref_obj$sets$purity)) {
      expect_equal(dev_obj$sets$purity, ref_obj$sets$purity,
                   tolerance = tolerance, info = "CS purity differs")
    }
    expect_equal(dev_obj$sets$coverage, ref_obj$sets$coverage,
                 tolerance = tolerance, info = "CS coverage differs")
  }

  invisible(TRUE)
}

# Compare susie_ss objects
expect_equal_susie_ss_objects <- function(dev_obj, ref_obj, tolerance = 1e-8) {
  # Use the same comparisons as susie objects
  expect_equal_susie_objects(dev_obj, ref_obj, tolerance)

  # Additional checks specific to sufficient statistics
  if (!is.null(dev_obj$XtXr) && !is.null(ref_obj$XtXr)) {
    expect_equal(dev_obj$XtXr, ref_obj$XtXr, tolerance = tolerance,
                 info = "XtXr differs")
  }

  invisible(TRUE)
}

# Compare susie_rss objects
expect_equal_susie_rss_objects <- function(dev_obj, ref_obj, tolerance = 1e-8) {
  # Use the same comparisons as susie objects
  expect_equal_susie_objects(dev_obj, ref_obj, tolerance)

  # Additional checks specific to RSS
  if (!is.null(dev_obj$Rz) && !is.null(ref_obj$Rz)) {
    expect_equal(dev_obj$Rz, ref_obj$Rz, tolerance = tolerance,
                 info = "Rz differs")
  }

  invisible(TRUE)
}


================================================
FILE: tests/testthat/helper_testthat.R
================================================
# =============================================================================
# HELPER FUNCTIONS FOR UNIT TESTS
# =============================================================================
#
# This file provides helper functions for testing the susieR package. These
# functions are automatically loaded by testthat when running tests.
#
# CONTENTS:
#
# 1. DATA SIMULATION FUNCTIONS
#    - simulate()            : Legacy simulation (sparse/dense matrices)
#    - simulate_tf()         : Simulate trend filtering data
#    - simulate_regression() : Simulate linear regression with causal effects
#
# 2. DATA SETUP FUNCTIONS (Constructor-based)
#    - setup_individual_data() : Create 'individual' class test data
#    - setup_ss_data()         : Create 'ss' class test data
#    - setup_rss_lambda_data() : Create 'rss_lambda' class test data
#
# 3. CUSTOM EXPECTATION FUNCTIONS
#    - expect_equal_susie_*() : Compare susie objects (individual/ss/rss)
#    - expect_equal_SER_*()   : Compare single effect regression results
#
# 4. UTILITY FUNCTIONS
#    - set_X_attributes()     : Set standardization attributes on X matrix
#    - compute_summary_stats() : Compute XtX, Xty, yty from X, y
#    - create_sparsity_mat()  : Create sparse matrix with given sparsity
#
# USAGE NOTES:
#
# - All simulation functions use set.seed() internally for reproducibility
# - Setup functions return list(data, params, model) ready for testing
# - Custom expectation functions handle tolerance and class-specific fields
# - For new tests, prefer simulate_regression() over legacy simulate()
# - Setup functions use actual constructors to ensure correct initialization
#
# =============================================================================

# -----------------------------------------------------------------------------
# UTILITY FUNCTIONS
# -----------------------------------------------------------------------------

#' Set standardization attributes on matrix X
#'
#' Sets three attributes on the input matrix: `scaled:center` (column means),
#' `scaled:scale` (column standard deviations), and `d` (column sums of
#' squared standardized values). These attributes are used by SuSiE algorithm
#' to efficiently handle standardized data.
#'
#' @param X An n by p data matrix (dense, sparse, or trend filtering matrix)
#' @param center Logical; if TRUE, center by column means
#' @param scale Logical; if TRUE, scale by column standard deviations
#' @return X with three attributes set: `scaled:center`, `scaled:scale`, and `d`
#' @keywords internal
#' @importFrom Matrix rowSums
#' @importFrom Matrix colMeans
set_X_attributes <- function(X, center = TRUE, scale = TRUE) {
  # NOTE(review): compute_tf_cm/compute_tf_csd/compute_tf_d and
  # compute_colSds come from the package under test (not defined in this
  # helper file).
  # if X is a trend filtering matrix
  if (!is.null(attr(X,"matrix.type"))) {
    order = attr(X,"order")
    n = ncol(X)
    # Set three attributes for X.
    attr(X,"scaled:center") = compute_tf_cm(order,n)
    attr(X,"scaled:scale") = compute_tf_csd(order,n)
    attr(X,"d") = compute_tf_d(order,n,attr(X,"scaled:center"),
                               attr(X,"scaled:scale"),scale,center)
    if (!center) attr(X,"scaled:center") = rep(0,n)
    if (!scale) attr(X,"scaled:scale") = rep(1,n)
  } else {
    # If X is either a dense or sparse ordinary matrix.
    # Get column means.
    cm = colMeans(X,na.rm = TRUE)
    # Get column standard deviations.
    csd = compute_colSds(X)
    # Set sd = 1 when the column has variance 0.
    csd[csd == 0] = 1
    if (!center) cm = rep(0,length = length(cm))
    if (!scale) csd = rep(1,length = length(cm))
    # Ah, this code is very inefficient because the matrix becomes
    # dense!
    #
    # X.std = as.matrix(X)
    # X.std = (t(X.std) - cm)/csd
    # attr(X,"d") = rowSums(X.std * X.std)
    #
    # Set three attributes for X. The closed-form below computes
    # sum((x_j - cm_j)^2)/csd_j^2 per column without densifying X:
    # sum(x_j^2) = n*mean^2 + (n-1)*sd^2, then subtract n*cm_j^2.
    n = nrow(X)
    d = n*colMeans(X)^2 + (n-1)*compute_colSds(X)^2
    d = (d - n*cm^2)/csd^2
    attr(X,"d") = d
    attr(X,"scaled:center") = cm
    attr(X,"scaled:scale") = csd
  }
  return(X)
}

#' Create sparse matrix with specified sparsity level
#'
#' Generates a binary matrix with a specified proportion of non-zero entries.
#' Used for testing sparse matrix operations.
#'
#' @param sparsity Proportion of zero entries (between 0 and 1)
#' @param n Number of rows
#' @param p Number of columns
#' @return Binary matrix with (1-sparsity)*n*p non-zero entries
#' @keywords internal
create_sparsity_mat <- function(sparsity, n, p) {
  nonzero <- round(n * p * (1 - sparsity))
  # Positions drawn without replacement over the flattened n*p grid.
  nonzero.idx <- sample(n * p, nonzero)
  mat <- numeric(n * p)
  mat[nonzero.idx] <- 1
  mat <- matrix(mat, nrow = n, ncol = p)
  return(mat)
}

# -----------------------------------------------------------------------------
# DATA SIMULATION FUNCTIONS
# -----------------------------------------------------------------------------

#' Simulate trend filtering data
#'
#' Generates synthetic data for testing trend filtering functionality.
#' Creates piecewise constant (order=0), linear (order=1), or quadratic
#' (order=2) signals with noise.
#'
#' @param order Trend filtering order (0, 1, or 2)
#' @return List with X (trend filtering matrix) and y (response vector)
#' @keywords internal
simulate_tf <- function(order) {
  # Pin the pre-3.6.0 sampler so results match archived reference output.
  suppressWarnings(RNGversion("3.5.0"))
  set.seed(2)
  n = 50

  # D is the first-order difference operator; solve(D), solve(D %*% D), ...
  # give the order-0, order-1, ... trend filtering basis matrices.
  D = diag(-1, n)
  for (i in 1:(n-1)){
    D[i, i+1] = 1
  }
  if (order==0) {
    # Piecewise-constant signal.
    beta = c(rep(0,5),rep(1,5),rep(3,5),rep(-2,5),rep(0,30))
    y = beta + rnorm(n)
    X = solve(D)
  } else if (order==1) {
    # Piecewise-linear signal with three segments.
    beta = numeric(n)
    for (i in 1:n){
      if (i <= 5){
        beta[i] = 0.001*i + 2
      } else if (i <= 15){
        beta[i] = 5*0.001*i + 1.6
      } else{
        beta[i] = 6.1 - 10*0.001*i
      }
    }
    y = beta + rnorm(n)
    X = solve(D%*%D)
  } else if (order==2) {
    # Piecewise-quadratic signal with three segments.
    beta = numeric(n)
    for (i in 1:n){
      if (i <= 5){
        beta[i] = (0.001*i)^2
      } else if (i <= 35){
        beta[i] = -5*(0.001*i)^2 + 0.06
      } else{
        beta[i] = 3*(0.001*i)^2 - 3.86
      }
    }
    y = beta + rnorm(n)
    X = solve(D%*%D%*%D)
  }
  return(list(X=X, y=y))
}

# -----------------------------------------------------------------------------
# CUSTOM EXPECTATION FUNCTIONS
# -----------------------------------------------------------------------------

# Compare the given named fields of two fit objects with testthat's
# expect_equal, using absolute (scale = 1) tolerance. Internal helper that
# removes the field-by-field duplication across the expect_equal_* wrappers.
.expect_fields_equal = function(new.res, original.res, fields, tolerance) {
  for (f in fields)
    expect_equal(new.res[[f]], original.res[[f]], scale = 1,
                 tolerance = tolerance)
}

# Compare the per-iteration state of two individual-data susie fits.
expect_equal_susie_update = function(new.res, original.res,
                                     tolerance = .Machine$double.eps^0.5){
  .expect_fields_equal(new.res, original.res,
                       c("alpha","mu","mu2","Xr","KL","sigma2","V"),
                       tolerance)
}

# Compare the per-iteration state of two sufficient-statistics susie fits
# (these carry XtXr instead of Xr).
expect_equal_susie_suff_stat_update = function(new.res, original.res,
                                               tolerance = .Machine$double.eps^0.5){
  .expect_fields_equal(new.res, original.res,
                       c("alpha","mu","mu2","XtXr","KL","sigma2","V"),
                       tolerance)
}

# Compare the per-iteration state of two RSS susie fits (these carry Rz).
expect_equal_susie_rss_update = function(new.res, original.res,
                                         tolerance = .Machine$double.eps^0.5){
  .expect_fields_equal(new.res, original.res,
                       c("alpha","mu","mu2","Rz","KL","sigma2","V"),
                       tolerance)
}

# Compare two single-effect-regression results; uses testthat's default
# (relative) tolerance, unlike the scaled comparisons above.
expect_equal_SER = function(new.res, original.res){
  for (f in c("alpha","mu","mu2","lbf","V","loglik"))
    expect_equal(new.res[[f]], original.res[[f]])
}

# Compare two sufficient-statistics SER results (these carry lbf_model).
expect_equal_SER_suff_stat = function(new.res, original.res,
                                      tolerance = .Machine$double.eps^0.5){
  .expect_fields_equal(new.res, original.res,
                       c("alpha","mu","mu2","lbf","V","lbf_model"),
                       tolerance)
}

# Compare two complete individual-data susie fits: iteration state plus the
# final summaries (elbo, niter, intercept, fitted values, scale factors).
expect_equal_susie = function(new.res, original.res,
                              tolerance = .Machine$double.eps^0.5){
  expect_equal_susie_update(new.res, original.res, tolerance = tolerance)
  .expect_fields_equal(new.res, original.res,
                       c("elbo","niter","intercept","fitted",
                         "X_column_scale_factors"),
                       tolerance)
}

# Compare two complete sufficient-statistics susie fits.
expect_equal_susie_suff_stat = function(new.res, original.res,
                                        tolerance = .Machine$double.eps^0.5){
  expect_equal_susie_suff_stat_update(new.res, original.res,
                                      tolerance = tolerance)
  .expect_fields_equal(new.res, original.res,
                       c("elbo","niter","intercept","Xtfitted"),
                       tolerance)
}

# Compare two complete RSS susie fits.
#
# BUG FIX: this previously forwarded 'scale = 1' to
# expect_equal_susie_rss_update(), which has no 'scale' argument, so every
# call failed with an "unused argument" error. The scale handling lives
# inside the update comparison itself.
expect_equal_susie_rss = function(new.res, original.res,
                                  tolerance = .Machine$double.eps^0.5){
  expect_equal_susie_rss_update(new.res, original.res, tolerance = tolerance)
  # Rz is re-checked here (also covered by the update comparison above) to
  # preserve the original function's behavior.
  .expect_fields_equal(new.res, original.res,
                       c("elbo","niter","intercept","Rz"),
                       tolerance)
}

#' Unified dispatcher for comparing susie objects
#'
#' Automatically detects the type of susie object and calls the appropriate
#' comparison function. This simplifies test code and ensures correct
#' comparison based on object structure.
#'
#' @param new.res New susie result object
#' @param original.res Original susie result object to compare against
#' @param tolerance Numerical tolerance for comparisons (default: sqrt(.Machine$double.eps))
#'
#' @details
#' Detects object type by checking for class-specific fields:
#' - Individual data: has 'Xr' field
#' - Sufficient stats: has 'XtXr' field
#' - RSS/RSS lambda: has 'Rz' field
#'
#' @examples
#' # Automatically handles all susie object types
#' fit1 <- susie(X, y, L = 5)
#' fit2 <- susie(X, y, L = 5)
#' expect_equal_susie_objects(fit1, fit2)
#'
expect_equal_susie_objects <- function(new.res, original.res,
                                       tolerance = .Machine$double.eps^0.5) {
  # A marker field counts only when both objects carry it; otherwise we fall
  # through to the error at the bottom.
  both_have <- function(field)
    !is.null(new.res[[field]]) && !is.null(original.res[[field]])

  if (both_have("Xr")) {
    # Individual-level data fits store fitted values in 'Xr'.
    expect_equal_susie(new.res, original.res, tolerance = tolerance)
  } else if (both_have("XtXr")) {
    # Sufficient-statistics fits store 'XtXr'.
    expect_equal_susie_suff_stat(new.res, original.res, tolerance = tolerance)
  } else if (both_have("Rz")) {
    # RSS and RSS-lambda fits store 'Rz'.
    expect_equal_susie_rss(new.res, original.res, tolerance = tolerance)
  } else {
    stop("Cannot determine susie object type. Unknown structure.")
  }
}

#' Unified dispatcher for comparing SER results
#'
#' Automatically detects the type of single effect regression result and calls
#' the appropriate comparison function.
#'
#' @param new.res New SER result object
#' @param original.res Original SER result object to compare against
#' @param tolerance Numerical tolerance for comparisons (default: sqrt(.Machine$double.eps))
#'
#' @details
#' Detects result type by checking for 'lbf_model' field (sufficient stats only)
#'
expect_equal_SER_objects <- function(new.res, original.res,
                                     tolerance = .Machine$double.eps^0.5) {
  # Only sufficient-statistics SER results carry 'lbf_model'; require it on
  # both objects before using the suff-stat comparison.
  is_suff_stat <- !is.null(new.res[["lbf_model"]]) &&
    !is.null(original.res[["lbf_model"]])

  if (is_suff_stat)
    expect_equal_SER_suff_stat(new.res, original.res, tolerance = tolerance)
  else
    expect_equal_SER(new.res, original.res)
}

# -----------------------------------------------------------------------------
# BASE HELPER FUNCTIONS (Internal - reduce duplication)
# -----------------------------------------------------------------------------

#' Generate base regression data for testing
#'
#' Creates random X matrix and y vector for use in test setup functions.
#' This function encapsulates the common data generation pattern used across
#' multiple setup functions to reduce code duplication.
#'
#' @param n Sample size
#' @param p Number of variables
#' @param k Number of causal variables (if 0, generates random y)
#' @param signal_sd Standard deviation of effect sizes for causal variables
#' @param seed Random seed (if NULL, no seed is set)
#' @return List with X, y, and optionally beta and causal_idx
#' @keywords internal
generate_base_data <- function(n, p, k = 0, signal_sd = 1, seed = NULL) {
  if (!is.null(seed))
    set.seed(seed)

  # Independent standard-normal design matrix.
  design <- matrix(rnorm(n * p), n, p)

  if (k <= 0) {
    # No causal structure: the response is pure noise.
    return(list(X = design, y = rnorm(n), n = n, p = p))
  }

  # Sparse coefficient vector with k randomly placed causal effects.
  effects <- rep(0, p)
  chosen <- sort(sample(1:p, k))
  effects[chosen] <- rnorm(k, mean = 0, sd = signal_sd)
  response <- as.vector(design %*% effects + rnorm(n))
  list(X = design, y = response, n = n, p = p,
       beta = effects, causal_idx = chosen)
}

#' Create base model structure
#'
#' Creates the common model list structure used across all data types.
#' This function encapsulates the shared model initialization pattern.
#'
#' @param L Number of single effects
#' @param p Number of variables
#' @param n Number of samples (for individual data, adds Xr field)
#' @param X_attr Optional attributes from X (for predictor_weights)
#' @return List with alpha, mu, mu2, V, sigma2, pi, lbf, lbf_variable, KL
#' @keywords internal
create_base_model <- function(L, p, n = NULL, X_attr = NULL) {
  # L x p zero matrix reused for all zero-initialized slots.
  zeros_Lp <- matrix(0, L, p)

  model <- list(
    alpha        = matrix(1 / p, L, p), # uniform inclusion probabilities
    mu           = zeros_Lp,
    mu2          = zeros_Lp,
    V            = rep(1, L),
    sigma2       = 1,
    pi           = rep(1 / p, p),       # uniform prior weights
    lbf          = rep(0, L),
    lbf_variable = zeros_Lp,
    KL           = rep(0, L),
    null_weight  = 0
  )

  # Class-specific extras.
  if (!is.null(X_attr))
    model[["predictor_weights"]] <- X_attr
  if (!is.null(n))
    model[["Xr"]] <- rep(0, n) # individual-data fitted values

  model
}

#' Create standard parameter list
#'
#' Creates the default params list used by setup functions. Provides consistent
#' defaults that can be overridden by specific setup functions.
#'
#' @param L Number of single effects
#' @param p Number of variables
#' @param unmappable_effects One of "none", "inf", or "ash"
#' @param additional_params Named list of additional/override parameters
#' @return List of parameters for SuSiE fitting
#' @keywords internal
create_base_params <- function(L, p, unmappable_effects = "none",
                               additional_params = list()) {
  # Default fitting options, grouped by purpose.
  defaults <- list(
    # Model size and preprocessing.
    L = L,
    intercept = TRUE,
    standardize = TRUE,
    # Variance estimation.
    estimate_residual_variance = TRUE,
    estimate_prior_variance = TRUE,
    estimate_prior_method = "optim",
    unmappable_effects = unmappable_effects,
    use_NIG = FALSE,
    # Post-processing.
    compute_univariate_zscore = TRUE,
    coverage = 0.95,
    min_abs_corr = 0.5,
    n_purity = 100,
    # Priors.
    check_null_threshold = 0.1,
    scaled_prior_variance = 0.2,
    prior_weights = rep(1 / p, p),
    null_weight = 0,
    residual_variance = NULL,
    # Iteration control.
    track_fit = FALSE,
    prior_tol = 1e-9,
    max_iter = 100,
    tol = 1e-3,
    convergence_method = "elbo",
    verbose = FALSE,
    refine = FALSE,
    model_init = NULL
  )

  # Apply caller overrides by name (deliberately not modifyList(), which
  # would drop entries whose override value is NULL).
  if (length(additional_params) > 0)
    defaults[names(additional_params)] <- additional_params

  defaults
}

# -----------------------------------------------------------------------------
# DATA SETUP FUNCTIONS (Constructor-based)
# -----------------------------------------------------------------------------

#' Setup individual-level data for testing
#'
#' Creates a complete test setup with individual-level data (X, y matrices),
#' parameters, and an initialized model. This is the primary setup function
#' for testing individual data methods.
#'
#' @param n Sample size
#' @param p Number of variables
#' @param L Number of single effects
#' @param seed Random seed for reproducibility
#' @return List with data (class: individual), params, and model
#' @keywords internal
#' @examples
#' # Internal use in tests
#' setup <- setup_individual_data(n = 100, p = 50, L = 5)
#' fit <- susie(setup$data$X, setup$data$y, L = setup$params$L)
setup_individual_data <- function(n = 100, p = 50, L = 5, seed = 42) {
  raw <- generate_base_data(n, p, k = 0, seed = seed)

  # Attach the centering/scaling attributes that the individual-data methods
  # expect on X, and center the response around zero.
  X <- set_X_attributes(raw$X, center = TRUE, scale = TRUE)
  mean_y <- mean(raw$y)
  y <- raw$y - mean_y

  data <- structure(
    list(X = X, y = y, n = n, p = p, mean_y = mean_y),
    class = "individual"
  )

  list(
    data = data,
    params = create_base_params(L, p, unmappable_effects = "none"),
    # Individual data gets an Xr slot and predictor weights from attr(X,"d").
    model = create_base_model(L, p, n = n, X_attr = attr(X, "d"))
  )
}

#' Setup sufficient statistics data with unmappable_effects support
#'
#' Creates a complete test setup with sufficient statistics (XtX, Xty, yty),
#' parameters, and an initialized model. Supports unmappable effects testing.
#'
#' @param n Number of samples
#' @param p Number of variables
#' @param L Number of single effects
#' @param seed Random seed
#' @param unmappable_effects One of "none" or "inf"
#' @return List with data (class: ss), params, and model
#' @keywords internal
setup_ss_data <- function(n = 100, p = 50, L = 5, seed = 42,
                          unmappable_effects = "none") {
  raw <- generate_base_data(n, p, k = 0, seed = seed)

  # Center X and y, mirroring what the constructor does.
  col_means <- colMeans(raw$X)
  X_centered <- sweep(raw$X, 2, col_means)
  y_mean <- mean(raw$y)
  y_centered <- raw$y - y_mean

  has_unmappable <- unmappable_effects != "none"

  # Build data/params through the real constructor (as susie_ss does), so
  # the setup matches production behavior, including the eigen decomposition
  # needed for unmappable effects.
  susie_objects <- sufficient_stats_constructor(
    XtX = crossprod(X_centered),
    Xty = as.vector(crossprod(X_centered, y_centered)),
    yty = sum(y_centered^2),
    n = n,
    L = L,
    X_colmeans = col_means,
    y_mean = y_mean,
    standardize = TRUE,
    unmappable_effects = unmappable_effects,
    residual_variance = 1, # initial residual variance
    estimate_residual_method = if (has_unmappable) "MoM" else "MLE",
    convergence_method = if (has_unmappable) "pip" else "elbo",
    coverage = 0.95,
    min_abs_corr = 0.5,
    n_purity = 100,
    check_prior = FALSE,
    track_fit = FALSE
  )

  data <- susie_objects$data

  # Base model plus the sufficient-statistics specific XtXr slot.
  model <- create_base_model(L, data$p, n = NULL,
                             X_attr = attr(data$XtX, "d"))
  model$XtXr <- rep(0, data$p)

  # Components used only by the infinitesimal unmappable-effects variant.
  if (unmappable_effects == "inf") {
    model$tau2 <- 0
    model$theta <- rep(0, data$p)
  }

  list(data = data, params = susie_objects$params, model = model)
}

#' Setup RSS lambda test data
#'
#' Creates a complete test setup for RSS with correlated residuals (lambda > 0).
#' Generates data with known causal structure, computes z-scores and correlation
#' matrix, and initializes model using the rss_lambda constructor.
#'
#' @param n Number of samples
#' @param p Number of variables
#' @param k Number of causal variables
#' @param lambda Lambda parameter (residual correlation, between 0 and 1)
#' @param signal_sd Standard deviation of causal effects
#' @param seed Random seed
#' @param L Number of single effects
#' @return List with X, y, beta, causal_idx, z, R, n, p, k, lambda, data, params, model
#' @keywords internal
setup_rss_lambda_data <- function(n = 500, p = 50, k = 3, lambda = 0.5,
                                  signal_sd = 0.5, seed = NULL, L = 5) {
  # Individual-level data with k causal effects.
  sim <- generate_base_data(n, p, k = k, signal_sd = signal_sd, seed = seed)

  # Summary statistics: LD matrix from XtX and marginal z-scores.
  input_ss <- compute_suff_stat(sim$X, sim$y, standardize = TRUE)
  marginal <- univariate_regression(sim$X, sim$y)
  R <- cov2cor(input_ss$XtX)
  R <- (R + t(R)) / 2 # enforce exact symmetry
  z <- marginal$betahat / marginal$sebetahat

  # Data/params via the rss_lambda constructor, then a properly
  # initialized model.
  built <- rss_lambda_constructor(z = z, R = R, lambda = lambda, n = n, L = L)
  var_y <- get_var_y.rss_lambda(built$data)
  model <- initialize_susie_model.rss_lambda(built$data, built$params, var_y)

  list(
    X = sim$X,
    y = sim$y,
    beta = sim$beta,
    causal_idx = sim$causal_idx,
    z = z,
    R = R,
    n = n,
    p = p,
    k = k,
    lambda = lambda,
    data = built$data,
    params = built$params,
    model = model
  )
}

# -----------------------------------------------------------------------------
# ADDITIONAL SIMULATION FUNCTIONS
# -----------------------------------------------------------------------------

#' Simulate simple regression data with known causal variables
#'
#' @param n Sample size
#' @param p Number of variables
#' @param k Number of causal variables
#'
@param signal_sd Standard deviation of effect sizes
#' @param noise_sd Standard deviation of noise
#' @param center Whether to center X and y
#' @param scale Whether to scale X to unit variance
#' @return List with X, y, beta, causal_idx
simulate_regression <- function(n = 100, p = 50, k = 3, signal_sd = 1,
                                noise_sd = 1, center = TRUE, scale = TRUE) {
  # Independent standard-normal design, optionally centered/scaled.
  X <- matrix(rnorm(n * p), n, p)
  if (center || scale)
    X <- scale(X, center = center, scale = scale)

  # Sparse coefficient vector: k randomly placed causal effects.
  effects <- rep(0, p)
  picks <- sort(sample(1:p, k))
  effects[picks] <- rnorm(k, mean = 0, sd = signal_sd)

  # Response, optionally centered to have zero mean.
  response <- drop(X %*% effects + rnorm(n, sd = noise_sd))
  if (center)
    response <- response - mean(response)

  list(X = X, y = response, beta = effects, causal_idx = picks,
       n = n, p = p, k = k)
}

#' Compute summary statistics (XtX, Xty, yty) from X and y
#'
#' @param X n x p matrix
#' @param y n vector
#' @return List with XtX, Xty, yty, n
compute_summary_stats <- function(X, y) {
  XtX <- crossprod(X)
  Xty <- drop(crossprod(X, y))
  list(XtX = XtX, Xty = Xty, yty = sum(y^2), n = length(y))
}

#' Create model with credible sets for refinement testing
#'
#' Generates synthetic data with known causal structure, fits SuSiE model,
#' and returns both the model and the data/params objects needed for
#' refinement testing. Used primarily by test_refinement.R.
#'
#' @param n Sample size
#' @param p Number of variables
#' @param L Number of single effects
#' @param n_causal Number of causal variables to simulate
#' @param seed Random seed for reproducibility
#' @param run_susie Logical; if TRUE, runs susie and returns model, otherwise just returns data
#' @return List with model, data, params, X, y, beta, causal_idx
#' @keywords internal
create_model_with_cs <- function(n = 100, p = 50, L = 5, n_causal = 3,
                                 seed = 42, run_susie = TRUE) {
  set.seed(seed)
  X <- matrix(rnorm(n * p), n, p)
  X <- scale(X, center = TRUE, scale = TRUE)
  beta <- rep(0, p)
  # Note: unlike generate_base_data(), the causal indices are NOT sorted here.
  causal_idx <- sample(1:p, n_causal)
  beta[causal_idx] <- rnorm(n_causal, sd = 1)
  # Low noise (sd = 0.5) so susie reliably produces credible sets.
  y <- as.vector(X %*% beta + rnorm(n, sd = 0.5))
  if (run_susie) {
    # Fit the model, and also build the matching data/params objects via the
    # real constructor so refinement tests can operate on them directly.
    model <- susie(X, y, L = L, verbose = FALSE)
    constructor_result <- individual_data_constructor(
      X = X,
      y = y,
      L = L,
      standardize = TRUE,
      intercept = TRUE,
      estimate_residual_method = "MLE",
      convergence_method = "elbo",
      coverage = 0.95,
      min_abs_corr = 0.5,
      n_purity = 100,
      track_fit = FALSE
    )
    return(list(
      model = model,
      data = constructor_result$data,
      params = constructor_result$params,
      X = X,
      y = y,
      beta = beta,
      causal_idx = causal_idx
    ))
  } else {
    # Data-only mode: return just the simulated quantities.
    return(list(
      X = X,
      y = y,
      beta = beta,
      causal_idx = causal_idx
    ))
  }
}


================================================
FILE: tests/testthat/reference/test_susie_auto_reference.R
================================================
# Source helper functions
source(file.path("..", "helper_reference.R"), local = TRUE)

context("susie_auto reference comparison")

# =============================================================================
# REFERENCE TESTS FOR susie_auto()
# =============================================================================
#
# These tests compare the new susieR implementation against the reference
# package (stephenslab/susieR@1f9166c) to ensure results are identical.
#
# Each test generates a fresh dataset under a fixed seed and delegates the
# dev-vs-reference comparison to compare_to_reference() (defined in
# helper_reference.R); skip_if_no_reference() skips when the reference
# package is unavailable.
#
# =============================================================================
# Part 1: Basic Tests with Default Parameters
# =============================================================================

test_that("susie_auto() matches reference with default parameters", {
  skip_if_no_reference()
  set.seed(1)
  n <- 100
  p <- 50
  X <- matrix(rnorm(n * p), n, p)
  beta <- rep(0, p)
  beta[1:4] <- c(2, 3, -2, 1.5)
  y <- as.vector(X %*% beta + rnorm(n))
  args <- list(X = X, y = y)
  compare_to_reference("susie_auto", args, tolerance = 1e-5)
})

test_that("susie_auto() matches reference with L_init=2", {
  skip_if_no_reference()
  set.seed(2)
  n <- 100
  p <- 50
  X <- matrix(rnorm(n * p), n, p)
  beta <- rep(0, p)
  beta[1:4] <- c(2, 3, -2, 1.5)
  y <- as.vector(X %*% beta + rnorm(n))
  args <- list(X = X, y = y, L_init = 2)
  compare_to_reference("susie_auto", args, tolerance = 1e-5)
})

test_that("susie_auto() matches reference with L_init=5, L_max=10", {
  skip_if_no_reference()
  set.seed(3)
  n <- 100
  p <- 50
  X <- matrix(rnorm(n * p), n, p)
  beta <- rep(0, p)
  beta[1:3] <- c(2, -1.5, 1)
  y <- as.vector(X %*% beta + rnorm(n))
  args <- list(X = X, y = y, L_init = 5, L_max = 10)
  compare_to_reference("susie_auto", args, tolerance = 1e-5)
})

# =============================================================================
# Part 2: standardize Parameter
# =============================================================================

test_that("susie_auto() matches reference with standardize=FALSE", {
  skip_if_no_reference()
  set.seed(4)
  n <- 100
  p <- 50
  X <- matrix(rnorm(n * p), n, p)
  beta <- rep(0, p)
  beta[1:4] <- c(2, 3, -2, 1.5)
  y <- as.vector(X %*% beta + rnorm(n))
  args <- list(X = X, y = y, standardize = FALSE)
  compare_to_reference("susie_auto", args, tolerance = 1e-5)
})

test_that("susie_auto() matches reference with standardize=TRUE", {
  skip_if_no_reference()
  set.seed(5)
  n <- 100
  p <- 50
  X <- matrix(rnorm(n * p), n, p)
  beta <- rep(0, p)
  beta[1:4] <- c(2, 3, -2, 1.5)
  y <- as.vector(X %*% beta + rnorm(n))
  args <- list(X = X, y = y, standardize = TRUE)
  compare_to_reference("susie_auto", args, tolerance = 1e-5)
})

# =============================================================================
# Part 3: intercept Parameter
# =============================================================================

test_that("susie_auto() matches reference with intercept=FALSE", {
  skip_if_no_reference()
  set.seed(6)
  n <- 100
  p <- 50
  X <- matrix(rnorm(n * p), n, p)
  beta <- rep(0, p)
  beta[1:4] <- c(2, 3, -2, 1.5)
  y <- as.vector(X %*% beta + rnorm(n))
  args <- list(X = X, y = y, intercept = FALSE)
  compare_to_reference("susie_auto", args, tolerance = 1e-5)
})

test_that("susie_auto() matches reference with intercept=TRUE", {
  skip_if_no_reference()
  set.seed(7)
  n <- 100
  p <- 50
  X <- matrix(rnorm(n * p), n, p)
  beta <- rep(0, p)
  beta[1:4] <- c(2, 3, -2, 1.5)
  y <- as.vector(X %*% beta + rnorm(n))
  args <- list(X = X, y = y, intercept = TRUE)
  compare_to_reference("susie_auto", args, tolerance = 1e-5)
})

# =============================================================================
# Part 4: Tolerance Parameters
# =============================================================================

test_that("susie_auto() matches reference with init_tol=0.1", {
  skip_if_no_reference()
  set.seed(8)
  n <- 100
  p <- 50
  X <- matrix(rnorm(n * p), n, p)
  beta <- rep(0, p)
  beta[1:4] <- c(2, 3, -2, 1.5)
  y <- as.vector(X %*% beta + rnorm(n))
  args <- list(X = X, y = y, init_tol = 0.1)
  compare_to_reference("susie_auto", args, tolerance = 1e-5)
})

test_that("susie_auto() matches reference with tol=1e-3", {
  skip_if_no_reference()
  set.seed(9)
  n <- 100
  # High-dimensional case (p >> n), unlike the other tests in this file.
  p <- 1000
  X <- matrix(rnorm(n * p), n, p)
  beta <- rep(0, p)
  beta[1:4] <- c(2, 3, -2, 1.5)
  y <- as.vector(X %*% beta + rnorm(n))
  args <- list(X = X, y = y, tol = 1e-3)
  compare_to_reference("susie_auto", args, tolerance = 1e-5)
})

# =============================================================================
# Part 5: max_iter Parameter
# =============================================================================

test_that("susie_auto() matches reference with max_iter=50", {
  skip_if_no_reference()
  set.seed(10)
  n <- 100
  p <- 50
  X <- matrix(rnorm(n * p), n, p)
  beta <- rep(0, p)
  beta[1:4] <- c(2, 3, -2, 1.5)
  y <- as.vector(X %*% beta + rnorm(n))
  args <- list(X = X, y = y, max_iter = 50)
  compare_to_reference("susie_auto", args, tolerance = 1e-5)
})

test_that("susie_auto() matches reference with max_iter=200", {
  skip_if_no_reference()
  set.seed(11)
  n <- 100
  p <- 50
  X <- matrix(rnorm(n * p), n, p)
  beta <- rep(0, p)
  beta[1:4] <- c(2, 3, -2, 1.5)
  y <- as.vector(X %*% beta + rnorm(n))
  args <- list(X = X, y = y, max_iter = 200)
  compare_to_reference("susie_auto", args, tolerance = 1e-5)
})

# =============================================================================
# Part 6: Combined Parameter Tests
# =============================================================================

test_that("susie_auto() matches reference with standardize=FALSE, intercept=FALSE", {
  skip_if_no_reference()
  set.seed(12)
  n <- 100
  p <- 50
  X <- matrix(rnorm(n * p), n, p)
  beta <- rep(0, p)
  beta[1:4] <- c(2, 3, -2, 1.5)
  y <- as.vector(X %*% beta + rnorm(n))
  args <- list(X = X, y = y, standardize = FALSE, intercept = FALSE)
  compare_to_reference("susie_auto", args, tolerance = 1e-5)
})

test_that("susie_auto() matches reference with L_init=2, L_max=8, init_tol=0.5", {
  skip_if_no_reference()
  set.seed(13)
  n <- 100
  p <- 50
  X <- matrix(rnorm(n * p), n, p)
  beta <- rep(0, p)
  beta[1:4] <- c(2, 3, -2, 1.5)
  y <- as.vector(X %*% beta + rnorm(n))
  args <- list(X = X, y = y, L_init = 2, L_max = 8, init_tol = 0.5)
  compare_to_reference("susie_auto", args, tolerance = 1e-5)
})

# =============================================================================
# Part 7: Edge Cases
# =============================================================================

test_that("susie_auto() matches reference with sparse signal", {
  skip_if_no_reference()
  set.seed(14)
  n <- 100
  p <- 50
  X <- matrix(rnorm(n * p), n, p)
  beta <- rep(0, p)
  beta[5] <- 3 # Only one effect
  y <- as.vector(X %*% beta + rnorm(n))
  args <- list(X = X, y = y)
  compare_to_reference("susie_auto", args, tolerance = 1e-5)
})

test_that("susie_auto() matches reference with dense signal", {
  skip_if_no_reference()
  set.seed(15)
  n <- 100
  p <- 50
  X <- matrix(rnorm(n * p), n, p)
  beta <- rep(0, p)
  beta[1:10] <- rnorm(10) # Ten effects
  y <- as.vector(X %*% beta + rnorm(n))
  args <- list(X = X, y = y, L_init = 5, L_max = 20)
  compare_to_reference("susie_auto", args, tolerance = 1e-5)
})

test_that("susie_auto() matches reference with high noise", {
  skip_if_no_reference()
  set.seed(16)
  n <- 100
  p <- 50
  X <- matrix(rnorm(n * p), n, p)
  beta <- rep(0, p)
  beta[1:4] <- c(2, 3, -2, 1.5)
  y <- as.vector(X %*% beta + rnorm(n, sd = 3)) # High noise
  args <- list(X = X, y = y)
  compare_to_reference("susie_auto", args, tolerance = 1e-5)
})


================================================
FILE: tests/testthat/reference/test_susie_nig_reference.R
================================================
# Source helper functions for NIG reference comparison
source(file.path("..", "helper_nig_reference.R"), local = TRUE)

context("susie NIG reference comparison")

# =============================================================================
# REFERENCE TESTS FOR susie(estimate_residual_method = "NIG")
# =============================================================================
#
# These tests compare our implementation of the NIG
# prior, invoked via estimate_residual_method = "NIG",
# against the reference implementation on the fix-susie-small-sigma-update
# branch of stephenslab/susieR (commit a999d44), where the equivalent
# feature is invoked via small = TRUE.
#
# Parameter mapping between the two interfaces:
# Dev: estimate_residual_method = "NIG" <-> Ref: small = TRUE
# Dev: tol (convergence tolerance) <-> Ref: tol_small
# Dev: convergence_method = "pip" (auto-set) <-> Ref: (hard-coded PIP convergence)
# Dev: estimate_prior_method = "EM" (auto-set) <-> Ref: (forced to EM)
# Dev: alpha0, beta0 <-> Ref: alpha0, beta0
#
# The helper function compare_NIG_to_reference() handles
# this mapping automatically.
# =============================================================================
# Part 1: Default parameters (baseline match)
# =============================================================================

test_that("NIG matches reference (small=TRUE) with defaults", {
  skip_if_no_nig_reference()
  set.seed(1)
  n <- 100
  p <- 50
  X <- matrix(rnorm(n * p), n, p)
  beta <- rep(0, p)
  beta[1:4] <- c(2, 3, -2, 1.5)
  y <- as.vector(X %*% beta + rnorm(n))
  # Dev: estimate_residual_method = "NIG" (set by helper)
  # Ref: small = TRUE (mapped by helper)
  # Reference defaults to alpha0 = beta0 = 0.1; dev's current default is
  # 1/sqrt(n). The helper forces 0.1 on the dev side when the caller
  # doesn't set these, so both runs use the same NIG hyperparameters.
  dev_args <- list(X = X, y = y, L = 10)
  results <- compare_NIG_to_reference(dev_args, tolerance = 1e-5)
  expect_equal_NIG_objects(results$dev, results$ref, tolerance = 1e-5)
})

# =============================================================================
# Part 2: L = 1 (single effect — ELBO is well-defined)
# =============================================================================

test_that("NIG matches reference with L = 1", {
  # Permanently skipped for now; see skip message below.
  skip("L=1 uses different convergence methods between dev and ref")
  skip_if_no_nig_reference()
  set.seed(2)
  n <- 100
  p <- 50
  X <- matrix(rnorm(n * p), n, p)
  beta <- rep(0, p)
  beta[3] <- 3
  y <- as.vector(X %*% beta + rnorm(n))
  dev_args <- list(X = X, y = y, L = 1)
  results <- compare_NIG_to_reference(dev_args, tolerance = 1e-5)
  expect_equal_NIG_objects(results$dev, results$ref, tolerance = 1e-5)
})

# =============================================================================
# Part 3: standardize = FALSE
# =============================================================================

test_that("NIG matches reference with standardize=FALSE", {
  skip_if_no_nig_reference()
  set.seed(3)
  n <- 100
  p <- 50
  X <- matrix(rnorm(n * p), n, p)
  beta <- rep(0, p)
  beta[1:4] <- c(2, 3, -2, 1.5)
  y <- as.vector(X %*% beta + rnorm(n))
  dev_args <- list(X = X, y = y, L = 10, standardize = FALSE)
  results <- compare_NIG_to_reference(dev_args, tolerance = 1e-5)
  expect_equal_NIG_objects(results$dev, results$ref, tolerance = 1e-5)
})

# =============================================================================
# Part 4: intercept = FALSE
# =============================================================================

test_that("NIG matches reference with intercept=FALSE", {
  skip_if_no_nig_reference()
  set.seed(4)
  n <- 100
  p <- 50
  X <- matrix(rnorm(n * p), n, p)
  beta <- rep(0, p)
  beta[1:4] <- c(2, 3, -2, 1.5)
  y <- as.vector(X %*% beta + rnorm(n))
  dev_args <- list(X = X, y = y, L = 10, intercept = FALSE)
  results <- compare_NIG_to_reference(dev_args, tolerance = 1e-5)
  expect_equal_NIG_objects(results$dev, results$ref, tolerance = 1e-5)
})

# =============================================================================
# Part 5: Custom alpha0 and beta0
# =============================================================================

test_that("NIG matches reference with custom alpha0/beta0", {
  skip_if_no_nig_reference()
  set.seed(5)
  n <- 100
  p <- 50
  X <- matrix(rnorm(n * p), n, p)
  beta <- rep(0, p)
  beta[1:4] <- c(2, 3, -2, 1.5)
  y <- as.vector(X %*% beta + rnorm(n))
  dev_args <- list(X = X, y = y, L = 10, alpha0 = 1.0, beta0 = 1.0)
  results <- compare_NIG_to_reference(dev_args, tolerance = 1e-5)
  expect_equal_NIG_objects(results$dev, results$ref, tolerance = 1e-5)
})

test_that("NIG matches reference with small alpha0/beta0", {
  skip_if_no_nig_reference()
  set.seed(6)
  n <- 100
  p <- 50
  X <- matrix(rnorm(n * p), n, p)
  beta <- rep(0, p)
  beta[1:4] <- c(2, 3, -2, 1.5)
  y <- as.vector(X %*% beta + rnorm(n))
  dev_args <- list(X = X, y = y, L = 10, alpha0 = 0.01, beta0 = 0.01)
  results <- compare_NIG_to_reference(dev_args, tolerance = 1e-5)
  expect_equal_NIG_objects(results$dev, results$ref, tolerance = 1e-5)
})

# =============================================================================
# Part 6: estimate_prior_variance = FALSE
# =============================================================================

test_that("NIG matches reference with estimate_prior_variance=FALSE", {
  skip_if_no_nig_reference()
  set.seed(7)
  n <- 100
  p <- 50
  X <- matrix(rnorm(n * p), n, p)
  beta <- rep(0, p)
  beta[1:4] <- c(2, 3, -2, 1.5)
  y <- as.vector(X %*% beta + rnorm(n))
  dev_args <- list(X = X, y = y, L = 10, estimate_prior_variance = FALSE)
  results <- compare_NIG_to_reference(dev_args, tolerance = 1e-5)
  expect_equal_NIG_objects(results$dev, results$ref, tolerance = 1e-5)
})

# =============================================================================
# Part 7: Explicit convergence tolerance
# =============================================================================
test_that("NIG matches reference with tol = 1e-4", {
  skip_if_no_nig_reference()
  set.seed(8)
  n <- 100
  p <- 50
  X <- matrix(rnorm(n * p), n, p)
  beta <- rep(0, p)
  beta[1:4] <- c(2, 3, -2, 1.5)
  y <- as.vector(X %*% beta + rnorm(n))
  # Dev uses tol; helper maps it to tol_small for reference
  args <- list(X = X, y = y, L = 10, tol = 1e-4)
  out <- compare_NIG_to_reference(args, tolerance = 1e-5)
  expect_equal_NIG_objects(out$dev, out$ref, tolerance = 1e-5)
})

# =============================================================================
# Part 8: max_iter boundary
# =============================================================================

test_that("NIG matches reference with small max_iter", {
  skip_if_no_nig_reference()
  set.seed(9)
  n <- 100
  p <- 50
  X <- matrix(rnorm(n * p), n, p)
  beta <- rep(0, p)
  beta[1:4] <- c(2, 3, -2, 1.5)
  y <- as.vector(X %*% beta + rnorm(n))
  # Force early termination to test partial convergence path
  args <- list(X = X, y = y, L = 10, max_iter = 5)
  out <- suppressWarnings(compare_NIG_to_reference(args, tolerance = 1e-5))
  expect_equal_NIG_objects(out$dev, out$ref, tolerance = 1e-5)
})

# =============================================================================
# Part 9: Sparse signal (most effects zero)
# =============================================================================

test_that("NIG matches reference with very sparse signal", {
  skip_if_no_nig_reference()
  set.seed(10)
  n <- 100
  p <- 200
  X <- matrix(rnorm(n * p), n, p)
  beta <- rep(0, p)
  beta[1] <- 5  # single strong effect
  y <- as.vector(X %*% beta + rnorm(n))
  args <- list(X = X, y = y, L = 5)
  out <- compare_NIG_to_reference(args, tolerance = 1e-5)
  expect_equal_NIG_objects(out$dev, out$ref, tolerance = 1e-5)
})

# =============================================================================
# Part 10: Small sample size (n < 80, the regime NIG targets)
# =============================================================================

test_that("NIG matches reference with small n", {
  skip_if_no_nig_reference()
  set.seed(11)
  n <- 30
  p <- 50
  X <- matrix(rnorm(n * p), n, p)
  beta <- rep(0, p)
  beta[1:2] <- c(3, -2)
  y <- as.vector(X %*% beta + rnorm(n))
  args <- list(X = X, y = y, L = 5)
  out <- compare_NIG_to_reference(args, tolerance = 1e-5)
  expect_equal_NIG_objects(out$dev, out$ref, tolerance = 1e-5)
})

# =============================================================================
# Part 11: High noise (large residual variance)
# =============================================================================

test_that("NIG matches reference with high noise", {
  skip_if_no_nig_reference()
  set.seed(12)
  n <- 100
  p <- 50
  X <- matrix(rnorm(n * p), n, p)
  beta <- rep(0, p)
  beta[1:4] <- c(2, 3, -2, 1.5)
  y <- as.vector(X %*% beta + rnorm(n, sd = 10))  # high noise
  args <- list(X = X, y = y, L = 10)
  out <- compare_NIG_to_reference(args, tolerance = 1e-5)
  expect_equal_NIG_objects(out$dev, out$ref, tolerance = 1e-5)
})

# =============================================================================
# Part 12: Combined — standardize=FALSE, intercept=FALSE
# =============================================================================

test_that("NIG matches reference with standardize=FALSE, intercept=FALSE", {
  skip_if_no_nig_reference()
  set.seed(13)
  n <- 100
  p <- 50
  X <- matrix(rnorm(n * p), n, p)
  beta <- rep(0, p)
  beta[1:4] <- c(2, 3, -2, 1.5)
  y <- as.vector(X %*% beta + rnorm(n))
  args <- list(X = X, y = y, L = 10, standardize = FALSE, intercept = FALSE)
  out <- compare_NIG_to_reference(args, tolerance = 1e-5)
  expect_equal_NIG_objects(out$dev, out$ref, tolerance = 1e-5)
})

# =============================================================================
# Part 13: Combined — custom alpha0/beta0 with standardize=FALSE
# =============================================================================

test_that("NIG matches reference with custom priors and standardize=FALSE", {
  skip_if_no_nig_reference()
  set.seed(14)
  n <- 100
  p <- 50
  X <- matrix(rnorm(n * p), n, p)
  beta <- rep(0, p)
  beta[1:4] <- c(2, 3, -2, 1.5)
  y <- as.vector(X %*% beta + rnorm(n))
  args <- list(X = X, y = y, L = 10, standardize = FALSE,
               alpha0 = 0.5, beta0 = 0.5)
  out <- compare_NIG_to_reference(args, tolerance = 1e-5)
  expect_equal_NIG_objects(out$dev, out$ref, tolerance = 1e-5)
})

# =============================================================================
# Part 14: Null signal (no true effects)
# =============================================================================

test_that("NIG matches reference under null signal", {
  skip_if_no_nig_reference()
  set.seed(15)
  n <- 100
  p <- 50
  X <- matrix(rnorm(n * p), n, p)
  y <- rnorm(n)  # pure noise
  args <- list(X = X, y = y, L = 5)
  out <- compare_NIG_to_reference(args, tolerance = 1e-5)
  expect_equal_NIG_objects(out$dev, out$ref, tolerance = 1e-5)
})

# =============================================================================
# Part 15: L = 1 with standardize = FALSE (ELBO well-defined, no scaling)
# =============================================================================

test_that("NIG matches reference with L=1, standardize=FALSE", {
  skip("L=1 uses different convergence methods between dev and ref")
  skip_if_no_nig_reference()
  set.seed(16)
  n <- 100
  p <- 50
  X <- matrix(rnorm(n * p), n, p)
  beta <- rep(0, p)
  beta[5] <- 4
  y <- as.vector(X %*% beta + rnorm(n))
  args <- list(X = X, y = y, L = 1, standardize = FALSE)
  out <- compare_NIG_to_reference(args, tolerance = 1e-5)
  expect_equal_NIG_objects(out$dev, out$ref, tolerance = 1e-5)
})

# =============================================================================
# Part 16: Small n with intercept = FALSE
# =============================================================================

test_that("NIG matches reference with small n and intercept=FALSE", {
  skip_if_no_nig_reference()
  set.seed(17)
  n <- 20
  p <- 30
  X <- matrix(rnorm(n * p), n, p)
  beta <- rep(0, p)
  beta[1] <- 5
  y <- as.vector(X %*% beta + rnorm(n))
  args <- list(X = X, y = y, L = 3, intercept = FALSE)
  out <- compare_NIG_to_reference(args, tolerance = 1e-5)
  expect_equal_NIG_objects(out$dev, out$ref, tolerance = 1e-5)
})

# =============================================================================
# Part 17: Diagnostic — field-by-field summary of discrepancies
# =============================================================================
#
# Prints a per-field summary of the numeric differences between dev and
# reference outputs (useful when diagnosing a regression), then asserts
# that every field-wise difference is below the tolerance.

test_that("NIG field-by-field difference summary", {
  skip_if_no_nig_reference()
  set.seed(100)
  n <- 100
  p <- 50
  X <- matrix(rnorm(n * p), n, p)
  beta <- rep(0, p)
  beta[1:4] <- c(2, 3, -2, 1.5)
  y <- as.vector(X %*% beta + rnorm(n))
  args <- list(X = X, y = y, L = 10)
  out <- compare_NIG_to_reference(args, tolerance = 1e-5)
  dev <- out$dev
  ref <- out$ref

  # Collect per-field max absolute differences
  fields <- c("alpha", "mu", "mu2", "V", "sigma2", "intercept", "fitted",
              "pip")
  diffs <- vapply(fields, function(f) {
    d <- dev[[f]]
    r <- ref[[f]]
    if (is.null(d) || is.null(r)) return(NA_real_)
    max(abs(d - r), na.rm = TRUE)
  }, numeric(1))

  # Print a summary table
  message("\n--- NIG vs reference: max |dev - ref| per field ---")
  for (f in names(diffs)) {
    message(sprintf(" %-12s: %s", f, format(diffs[f], digits = 8)))
  }

  # Convergence & iteration metadata
  message(sprintf(" niter (dev/ref): %d / %d", dev$niter, ref$niter))
  message(sprintf(" converged (dev/ref): %s / %s",
                  dev$converged, ref$converged))

  # Credible sets match
  if (!is.null(dev$sets$cs) && !is.null(ref$sets$cs)) {
    cs_match <- identical(dev$sets$cs, ref$sets$cs)
    message(sprintf(" CS sets identical: %s", cs_match))
  }

  # Hard assertion: all differences should be < tolerance
  expect_true(all(diffs[!is.na(diffs)] < 1e-5),
              info = paste("Some fields exceed tolerance:",
                           paste(names(which(diffs >= 1e-5)),
                                 collapse = ", ")))
})

# #############################################################################
# EXPANDED EDGE-CASE TEST SUITE
# #############################################################################

# =============================================================================
# Category A: Data dimensions
# =============================================================================

# Part 18: n >> p (overdetermined)
test_that("NIG matches reference with n >> p (overdetermined)", {
  skip_if_no_nig_reference()
  set.seed(101)
  n <- 500
  p <- 20
  X <- matrix(rnorm(n * p), n, p)
  beta <- rep(0, p)
  beta[1:3] <- c(2, -1.5, 3)
  y <- as.vector(X %*% beta + rnorm(n))
  args <- list(X = X, y = y, L = 5)
  out <- compare_NIG_to_reference(args, tolerance = 1e-5)
  expect_equal_NIG_objects(out$dev, out$ref, tolerance = 1e-5)
})

# Part 19: n << p (underdetermined, genetics regime)
test_that("NIG matches reference with n << p (underdetermined)", {
  skip_if_no_nig_reference()
  set.seed(102)
  n <- 30
  p <- 200
  X <- matrix(rnorm(n * p), n, p)
  beta <- rep(0, p)
  beta[c(5, 50)] <- c(3, -2)
  y <- as.vector(X %*% beta + rnorm(n))
  args <- list(X = X, y = y, L = 5)
  out <- compare_NIG_to_reference(args, tolerance = 1e-5)
  expect_equal_NIG_objects(out$dev, out$ref, tolerance = 1e-5)
})

# Part 20: n = p (square)
test_that("NIG matches reference with n = p (square)", {
  skip_if_no_nig_reference()
  set.seed(103)
  n <- 50
  p <- 50
  X <- matrix(rnorm(n * p), n, p)
  beta <- rep(0, p)
  beta[1:3] <- c(2, -2, 1.5)
  y <- as.vector(X %*% beta + rnorm(n))
  args <- list(X = X, y = y, L = 5)
  out <- compare_NIG_to_reference(args, tolerance = 1e-5)
  expect_equal_NIG_objects(out$dev, out$ref, tolerance = 1e-5)
})

# Part 21: Very small n
test_that("NIG matches reference with very small n", {
  skip_if_no_nig_reference()
  set.seed(104)
  n <- 10
  p <- 30
  X <- matrix(rnorm(n * p), n, p)
  beta <- rep(0, p)
  beta[1] <- 3
  y <- as.vector(X %*% beta + rnorm(n))
  args <- list(X = X, y = y, L = 3)
  out <- compare_NIG_to_reference(args, tolerance = 1e-5)
  expect_equal_NIG_objects(out$dev, out$ref, tolerance = 1e-5)
})

# =============================================================================
# Category B: Signal patterns
# =============================================================================

# Part 22: Weak signals (low SNR)
test_that("NIG matches reference with weak signals", {
  skip_if_no_nig_reference()
  set.seed(105)
  n <- 100
  p <- 50
  X <- matrix(rnorm(n * p), n, p)
  beta <- rep(0, p)
  beta[1:3] <- c(0.3, -0.3, 0.2)
  y <- as.vector(X %*% beta + rnorm(n))
  args <- list(X = X, y = y, L = 5)
  out <- compare_NIG_to_reference(args, tolerance = 1e-5)
  expect_equal_NIG_objects(out$dev, out$ref, tolerance = 1e-5)
})

# Part 23: Very strong signals
test_that("NIG matches reference with very strong signals", {
  skip_if_no_nig_reference()
  set.seed(106)
  n <- 100
  p <- 50
  X <- matrix(rnorm(n * p), n, p)
  beta <- rep(0, p)
  beta[1:3] <- c(10, -15, 20)
  y <- as.vector(X %*% beta + rnorm(n))
  args <- list(X = X, y = y, L = 5)
  out <- compare_NIG_to_reference(args, tolerance = 1e-5)
  expect_equal_NIG_objects(out$dev, out$ref, tolerance = 1e-5)
})

# Part 24: Mixed strength signals
test_that("NIG matches reference with mixed strength signals", {
  skip_if_no_nig_reference()
  set.seed(107)
  n <- 100
  p <- 50
  X <- matrix(rnorm(n * p), n, p)
  beta <- rep(0, p)
  beta[1:4] <- c(10, 0.5, -10, 0.3)
  y <- as.vector(X %*% beta + rnorm(n))
  args <- list(X = X, y = y, L = 10)
  out <- compare_NIG_to_reference(args, tolerance = 1e-5)
  expect_equal_NIG_objects(out$dev, out$ref, tolerance = 1e-5)
})

# Part 25: Many true effects
test_that("NIG matches reference with many true effects", {
  skip_if_no_nig_reference()
  set.seed(108)
  n <- 100
  p <- 50
  X <- matrix(rnorm(n * p), n, p)
  beta <- rep(0, p)
  beta[1:10] <- c(2, -1.5, 3, -2, 1, -1, 2.5, -0.8, 1.2, -1.8)
  y <- as.vector(X %*% beta + rnorm(n))
  args <- list(X = X, y = y, L = 10)
  out <- compare_NIG_to_reference(args, tolerance = 1e-5)
  expect_equal_NIG_objects(out$dev, out$ref, tolerance = 1e-5)
})

# =============================================================================
# Category C: L values
# =============================================================================

# Part 26: L = 2 (minimal multi-effect)
test_that("NIG matches reference with L = 2", {
  skip_if_no_nig_reference()
  set.seed(109)
  n <- 100
  p <- 50
  X <- matrix(rnorm(n * p), n, p)
  beta <- rep(0, p)
  beta[1:2] <- c(3, -2)
  y <- as.vector(X %*% beta + rnorm(n))
  args <- list(X = X, y = y, L = 2)
  out <- compare_NIG_to_reference(args, tolerance = 1e-5)
  expect_equal_NIG_objects(out$dev, out$ref, tolerance = 1e-5)
})

# Part 27: L = 20 (more effects than default)
test_that("NIG matches reference with L = 20", {
  skip_if_no_nig_reference()
  set.seed(110)
  n <- 100
  p <- 50
  X <- matrix(rnorm(n * p), n, p)
  beta <- rep(0, p)
  beta[1:4] <- c(2, 3, -2, 1.5)
  y <- as.vector(X %*% beta + rnorm(n))
  args <- list(X = X, y = y, L = 20)
  out <- compare_NIG_to_reference(args, tolerance = 1e-5)
  expect_equal_NIG_objects(out$dev, out$ref, tolerance = 1e-5)
})

# Part 28: L >> true effects (over-specified)
test_that("NIG matches reference with L >> true effects", {
  skip_if_no_nig_reference()
  set.seed(111)
  n <- 100
  p <- 50
  X <- matrix(rnorm(n * p), n, p)
  beta <- rep(0, p)
  beta[1:2] <- c(3, -2)
  y <- as.vector(X %*% beta + rnorm(n))
  args <- list(X = X, y = y, L = 15)
  out <- compare_NIG_to_reference(args, tolerance = 1e-5)
  expect_equal_NIG_objects(out$dev, out$ref, tolerance = 1e-5)
})

# Part 29: L < true effects (under-specified)
test_that("NIG matches reference with L < true effects", {
  skip_if_no_nig_reference()
  set.seed(112)
  n <- 100
  p <- 50
  X <- matrix(rnorm(n * p), n, p)
  beta <- rep(0, p)
  beta[1:5] <- c(3, -2, 4, -1.5, 2)
  y <- as.vector(X %*% beta + rnorm(n))
  args <- list(X = X, y = y, L = 2)
  out <- compare_NIG_to_reference(args, tolerance = 1e-5)
  expect_equal_NIG_objects(out$dev, out$ref, tolerance = 1e-5)
})

# =============================================================================
# Category D: Prior parameters alpha0/beta0
# =============================================================================

# Part 30: Informative priors
test_that("NIG matches reference with informative alpha0/beta0", {
  skip_if_no_nig_reference()
  set.seed(113)
  n <- 100
  p <- 50
  X <- matrix(rnorm(n * p), n, p)
  beta <- rep(0, p)
  beta[1:4] <- c(2, 3, -2, 1.5)
  y <- as.vector(X %*% beta + rnorm(n))
  args <- list(X = X, y = y, L = 10, alpha0 = 10, beta0 = 10)
  out <- compare_NIG_to_reference(args, tolerance = 1e-5)
  expect_equal_NIG_objects(out$dev, out$ref, tolerance = 1e-5)
})

# Part 31: Very diffuse priors
test_that("NIG matches reference with very diffuse alpha0/beta0", {
  skip_if_no_nig_reference()
  set.seed(114)
  n <- 100
  p <- 50
  X <- matrix(rnorm(n * p), n, p)
  beta <- rep(0, p)
  beta[1:4] <- c(2, 3, -2, 1.5)
  y <- as.vector(X %*% beta + rnorm(n))
  args <- list(X = X, y = y, L = 10, alpha0 = 0.001, beta0 = 0.001)
  out <- compare_NIG_to_reference(args, tolerance = 1e-5)
  expect_equal_NIG_objects(out$dev, out$ref, tolerance = 1e-5)
})

# Part 32: Asymmetric priors
test_that("NIG matches reference with asymmetric alpha0/beta0", {
  skip_if_no_nig_reference()
  set.seed(115)
  n <- 100
  p <- 50
  X <- matrix(rnorm(n * p), n, p)
  beta <- rep(0, p)
  beta[1:4] <- c(2, 3, -2, 1.5)
  y <- as.vector(X %*% beta + rnorm(n))
  args <- list(X = X, y = y, L = 10, alpha0 = 0.1, beta0 = 1.0)
  out <- compare_NIG_to_reference(args, tolerance = 1e-5)
  expect_equal_NIG_objects(out$dev, out$ref, tolerance = 1e-5)
})

# =============================================================================
# Category E: Predictor structure
# =============================================================================

# Part 33: AR(1) correlated predictors
test_that("NIG matches reference with AR(1) correlated X", {
  skip_if_no_nig_reference()
  set.seed(116)
  n <- 100
  p <- 50
  rho <- 0.8
  # Generate AR(1) correlation structure
  Z <- matrix(rnorm(n * p), n, p)
  X <- Z
  for (j in 2:p) {
    X[, j] <- rho * X[, j - 1] + sqrt(1 - rho^2) * Z[, j]
  }
  beta <- rep(0, p)
  beta[c(1, 25)] <- c(3, -2)
  y <- as.vector(X %*% beta + rnorm(n))
  args <- list(X = X, y = y, L = 5)
  out <- compare_NIG_to_reference(args, tolerance = 1e-5)
  expect_equal_NIG_objects(out$dev, out$ref, tolerance = 1e-5)
})

# Part 34: Block-correlated predictors
test_that("NIG matches reference with block-correlated X", {
  skip_if_no_nig_reference()
  set.seed(117)
  n <- 100
  p <- 50
  block_size <- 5
  n_blocks <- p / block_size
  # Generate block correlation structure
  X <- matrix(0, n, p)
  for (b in seq_len(n_blocks)) {
    cols <- ((b - 1) * block_size + 1):(b * block_size)
    common <- rnorm(n)
    for (j in cols) {
      X[, j] <- 0.8 * common + 0.6 * rnorm(n)
    }
  }
  beta <- rep(0, p)
  beta[c(1, 26)] <- c(3, -2)  # one in first block, one in sixth block
  y <- as.vector(X %*% beta + rnorm(n))
  args <- list(X = X, y = y, L = 5)
  out <- compare_NIG_to_reference(args, tolerance = 1e-5)
  expect_equal_NIG_objects(out$dev, out$ref, tolerance = 1e-5)
})

# Part 35: Near-collinear predictors
test_that("NIG matches reference with near-collinear predictors", {
  skip_if_no_nig_reference()
  set.seed(118)
  n <- 100
  p <- 50
  X <- matrix(rnorm(n * p), n, p)
  # Make columns 2 nearly identical to column 1 (r ~ 0.99)
  X[, 2] <- X[, 1] + rnorm(n, sd = 0.1)
  beta <- rep(0, p)
  beta[c(1, 2)] <- c(2, -1.5)  # both collinear predictors active
  y <- as.vector(X %*% beta + rnorm(n))
  args <- list(X = X, y = y, L = 5)
  out <- compare_NIG_to_reference(args, tolerance = 1e-5)
  expect_equal_NIG_objects(out$dev, out$ref, tolerance = 1e-5)
})

# =============================================================================
# Category F: Convergence settings
# =============================================================================

# Part 36: max_iter = 1 (single iteration snapshot)
test_that("NIG matches reference with max_iter = 1", {
  skip_if_no_nig_reference()
  set.seed(119)
  n <- 100
  p <- 50
  X <- matrix(rnorm(n * p), n, p)
  beta <- rep(0, p)
  beta[1:4] <- c(2, 3, -2, 1.5)
  y <- as.vector(X %*% beta + rnorm(n))
  args <- list(X = X, y = y, L = 10, max_iter = 1)
  out <- suppressWarnings(compare_NIG_to_reference(args, tolerance = 1e-5))
  expect_equal_NIG_objects(out$dev, out$ref, tolerance = 1e-5)
})

# Part 37: max_iter = 2 (minimal convergence path)
test_that("NIG matches reference with max_iter = 2", {
  skip_if_no_nig_reference()
  set.seed(120)
  n <- 100
  p <- 50
  X <- matrix(rnorm(n * p), n, p)
  beta <- rep(0, p)
  beta[1:4] <- c(2, 3, -2, 1.5)
  y <- as.vector(X %*% beta + rnorm(n))
  args <- list(X = X, y = y, L = 10, max_iter = 2)
  out <- suppressWarnings(compare_NIG_to_reference(args, tolerance = 1e-5))
  expect_equal_NIG_objects(out$dev, out$ref, tolerance = 1e-5)
})

# Part 38: Tight convergence tolerance
test_that("NIG matches reference with tight tol = 1e-6", {
  skip_if_no_nig_reference()
  set.seed(121)
  n <- 100
  p <- 50
  X <- matrix(rnorm(n * p), n, p)
  beta <- rep(0, p)
  beta[1:4] <- c(2, 3, -2, 1.5)
  y <- as.vector(X %*% beta + rnorm(n))
  args <- list(X = X, y = y, L = 10, tol = 1e-6)
  out <- compare_NIG_to_reference(args, tolerance = 1e-5)
  expect_equal_NIG_objects(out$dev, out$ref, tolerance = 1e-5)
})

# =============================================================================
# Category G: null_weight and prior_weights
# =============================================================================

# Part 39: null_weight = 0.5 (strong null prior)
test_that("NIG matches reference with null_weight = 0.5", {
  skip("null_weight + NIG triggers NA in loglik (dev-side bug)")
  skip_if_no_nig_reference()
  set.seed(122)
  n <- 100
  p <- 50
  X <- matrix(rnorm(n * p), n, p)
  beta <- rep(0, p)
  beta[1:4] <- c(2, 3, -2, 1.5)
  y <- as.vector(X %*% beta + rnorm(n))
  args <- list(X = X, y = y, L = 10, null_weight = 0.5)
  out <- compare_NIG_to_reference(args, tolerance = 1e-5)
  expect_equal_NIG_objects(out$dev, out$ref, tolerance = 1e-5)
})

# Part 40: Non-uniform prior_weights
test_that("NIG matches reference with non-uniform prior_weights", {
  skip_if_no_nig_reference()
  set.seed(123)
  n <- 100
  p <- 50
  X <- matrix(rnorm(n * p), n, p)
  beta <- rep(0, p)
  beta[1:4] <- c(2, 3, -2, 1.5)
  y <- as.vector(X %*% beta + rnorm(n))
  # Favor first 10 predictors
  pw <- rep(1, p)
  pw[1:10] <- 5
  pw <- pw / sum(pw)
  args <- list(X = X, y = y, L = 10, prior_weights = pw)
  out <- compare_NIG_to_reference(args, tolerance = 1e-5)
  expect_equal_NIG_objects(out$dev, out$ref, tolerance = 1e-5)
})

# =============================================================================
# Category H: Parameter combinations
# =============================================================================

# Part 41: Small n + weak signal
test_that("NIG matches reference with small n + weak signal", {
  skip_if_no_nig_reference()
  set.seed(124)
  n <- 20
  p <- 50
  X <- matrix(rnorm(n * p), n, p)
  beta <- rep(0, p)
  beta[1:2] <- c(0.5, -0.3)
  y <- as.vector(X %*% beta + rnorm(n))
  args <- list(X = X, y = y, L = 5)
  out <- compare_NIG_to_reference(args, tolerance = 1e-5)
  expect_equal_NIG_objects(out$dev, out$ref, tolerance = 1e-5)
})

# Part 42: n << p + L large
test_that("NIG matches reference with n << p and large L", {
  skip_if_no_nig_reference()
  set.seed(125)
  n <- 30
  p <- 200
  X <- matrix(rnorm(n * p), n, p)
  beta <- rep(0, p)
  beta[c(10, 50, 100)] <- c(3, -2, 4)
  y <- as.vector(X %*% beta + rnorm(n))
  args <- list(X = X, y = y, L = 10)
  out <- compare_NIG_to_reference(args, tolerance = 1e-5)
  expect_equal_NIG_objects(out$dev, out$ref, tolerance = 1e-5)
})

# Part 43: intercept=FALSE + small n
test_that("NIG matches reference with intercept=FALSE + small n", {
  skip_if_no_nig_reference()
  set.seed(126)
  n <- 25
  p <- 40
  X <- matrix(rnorm(n * p), n, p)
  beta <- rep(0, p)
  beta[1:3] <- c(2, -1.5, 3)
  y <- as.vector(X %*% beta + rnorm(n))
  args <- list(X = X, y = y, L = 5, intercept = FALSE)
  out <- compare_NIG_to_reference(args, tolerance = 1e-5)
  expect_equal_NIG_objects(out$dev, out$ref, tolerance = 1e-5)
})

# Part 44: standardize=FALSE + custom alpha0/beta0
test_that("NIG matches reference with standardize=FALSE + custom priors", {
  skip_if_no_nig_reference()
  set.seed(127)
  n <- 100
  p <- 50
  X <- matrix(rnorm(n * p), n, p)
  beta <- rep(0, p)
  beta[1:4] <- c(2, 3, -2, 1.5)
  y <- as.vector(X %*% beta + rnorm(n))
  args <- list(X = X, y = y, L = 10, standardize = FALSE,
               alpha0 = 1.0, beta0 = 0.5)
  out <- compare_NIG_to_reference(args, tolerance = 1e-5)
  expect_equal_NIG_objects(out$dev, out$ref, tolerance = 1e-5)
})

# Part 45: estimate_prior_variance=FALSE + intercept=FALSE
test_that("NIG matches reference with estimate_prior_variance=FALSE + intercept=FALSE", {
  skip_if_no_nig_reference()
  set.seed(128)
  n <- 100
  p <- 50
  X <- matrix(rnorm(n * p), n, p)
  beta <- rep(0, p)
  beta[1:4] <- c(2, 3, -2, 1.5)
  y <- as.vector(X %*% beta + rnorm(n))
  args <- list(X = X, y = y, L = 10, estimate_prior_variance = FALSE,
               intercept = FALSE)
  out <- compare_NIG_to_reference(args, tolerance = 1e-5)
  expect_equal_NIG_objects(out$dev, out$ref, tolerance = 1e-5)
})

# =============================================================================
# Category I: L = 1 variants
# =============================================================================
# Part 46: L=1 + high noise
test_that("NIG matches reference with L=1 + high noise", {
  skip("L=1 uses different convergence methods between dev and ref")
  skip_if_no_nig_reference()
  set.seed(129)
  n <- 100
  p <- 50
  X <- matrix(rnorm(n * p), n, p)
  beta <- rep(0, p)
  beta[1] <- 3
  y <- as.vector(X %*% beta + rnorm(n, sd = 10))
  args <- list(X = X, y = y, L = 1)
  out <- compare_NIG_to_reference(args, tolerance = 1e-5)
  expect_equal_NIG_objects(out$dev, out$ref, tolerance = 1e-5)
})

# Part 47: L=1 + very small n
test_that("NIG matches reference with L=1 + very small n", {
  skip("L=1 uses different convergence methods between dev and ref")
  skip_if_no_nig_reference()
  set.seed(130)
  n <- 15
  p <- 30
  X <- matrix(rnorm(n * p), n, p)
  beta <- rep(0, p)
  beta[1] <- 4
  y <- as.vector(X %*% beta + rnorm(n))
  args <- list(X = X, y = y, L = 1)
  out <- compare_NIG_to_reference(args, tolerance = 1e-5)
  expect_equal_NIG_objects(out$dev, out$ref, tolerance = 1e-5)
})

# Part 48: L=1 + null signal (no true effect)
test_that("NIG matches reference with L=1 + null signal", {
  skip("L=1 uses different convergence methods between dev and ref")
  skip_if_no_nig_reference()
  set.seed(131)
  n <- 100
  p <- 50
  X <- matrix(rnorm(n * p), n, p)
  y <- rnorm(n)  # pure noise
  args <- list(X = X, y = y, L = 1)
  out <- compare_NIG_to_reference(args, tolerance = 1e-5)
  expect_equal_NIG_objects(out$dev, out$ref, tolerance = 1e-5)
})

# #############################################################################
# SUFFICIENT STATISTICS VS INDIVIDUAL-LEVEL DATA COMPARISON
# #############################################################################
#
# For each reference test scenario above, verify that susie_ss()
# produces the same result as susie() with NIG.
# These tests do NOT require the reference package.
# ============================================================================= # SS Part 1: Default parameters (baseline match) # ============================================================================= test_that("SS matches individual: defaults (Part 1)", { set.seed(1) n <- 100; p <- 50 X <- matrix(rnorm(n * p), n, p) beta <- rep(0, p); beta[1:4] <- c(2, 3, -2, 1.5) y <- as.vector(X %*% beta + rnorm(n)) res <- run_ss_and_individual_NIG(X, y, list(L = 10)) expect_ss_matches_individual_ss(res) }) # ============================================================================= # SS Part 2: L = 1 (skipped — convergence method differs) # ============================================================================= test_that("SS matches individual: L = 1 (Part 2)", { skip("L=1 uses different convergence methods between dev and ref") set.seed(2) n <- 100; p <- 50 X <- matrix(rnorm(n * p), n, p) beta <- rep(0, p); beta[3] <- 3 y <- as.vector(X %*% beta + rnorm(n)) res <- run_ss_and_individual_NIG(X, y, list(L = 1)) expect_ss_matches_individual_ss(res) }) # ============================================================================= # SS Part 3: standardize = FALSE # ============================================================================= test_that("SS matches individual: standardize=FALSE (Part 3)", { set.seed(3) n <- 100; p <- 50 X <- matrix(rnorm(n * p), n, p) beta <- rep(0, p); beta[1:4] <- c(2, 3, -2, 1.5) y <- as.vector(X %*% beta + rnorm(n)) res <- run_ss_and_individual_NIG(X, y, list(L = 10, standardize = FALSE)) expect_ss_matches_individual_ss(res) }) # ============================================================================= # SS Part 4: Custom alpha0 and beta0 # ============================================================================= test_that("SS matches individual: custom alpha0/beta0 (Part 4)", { set.seed(5) n <- 100; p <- 50 X <- matrix(rnorm(n * p), n, p) beta <- rep(0, p); beta[1:4] <- c(2, 3, -2, 1.5) y <- as.vector(X %*% beta + 
rnorm(n)) res <- run_ss_and_individual_NIG(X, y, list(L = 10, alpha0 = 1.0, beta0 = 1.0)) expect_ss_matches_individual_ss(res) }) test_that("SS matches individual: small alpha0/beta0 (Part 5)", { set.seed(6) n <- 100; p <- 50 X <- matrix(rnorm(n * p), n, p) beta <- rep(0, p); beta[1:4] <- c(2, 3, -2, 1.5) y <- as.vector(X %*% beta + rnorm(n)) res <- run_ss_and_individual_NIG(X, y, list(L = 10, alpha0 = 0.01, beta0 = 0.01)) expect_ss_matches_individual_ss(res) }) # ============================================================================= # SS Part 6: estimate_prior_variance = FALSE # ============================================================================= test_that("SS matches individual: estimate_prior_variance=FALSE (Part 6)", { set.seed(7) n <- 100; p <- 50 X <- matrix(rnorm(n * p), n, p) beta <- rep(0, p); beta[1:4] <- c(2, 3, -2, 1.5) y <- as.vector(X %*% beta + rnorm(n)) res <- run_ss_and_individual_NIG(X, y, list(L = 10, estimate_prior_variance = FALSE)) expect_ss_matches_individual_ss(res) }) # ============================================================================= # SS Part 7: Explicit convergence tolerance # ============================================================================= test_that("SS matches individual: tol = 1e-4 (Part 7)", { set.seed(8) n <- 100; p <- 50 X <- matrix(rnorm(n * p), n, p) beta <- rep(0, p); beta[1:4] <- c(2, 3, -2, 1.5) y <- as.vector(X %*% beta + rnorm(n)) res <- run_ss_and_individual_NIG(X, y, list(L = 10, tol = 1e-4)) expect_ss_matches_individual_ss(res) }) # ============================================================================= # SS Part 8: max_iter boundary # ============================================================================= test_that("SS matches individual: small max_iter (Part 8)", { set.seed(9) n <- 100; p <- 50 X <- matrix(rnorm(n * p), n, p) beta <- rep(0, p); beta[1:4] <- c(2, 3, -2, 1.5) y <- as.vector(X %*% beta + rnorm(n)) res <- run_ss_and_individual_NIG(X, y, list(L = 10, 
max_iter = 5)) expect_ss_matches_individual_ss(res) }) # ============================================================================= # SS Part 9: Sparse signal # ============================================================================= test_that("SS matches individual: very sparse signal (Part 9)", { set.seed(10) n <- 100; p <- 200 X <- matrix(rnorm(n * p), n, p) beta <- rep(0, p); beta[1] <- 5 y <- as.vector(X %*% beta + rnorm(n)) res <- run_ss_and_individual_NIG(X, y, list(L = 5)) expect_ss_matches_individual_ss(res) }) # ============================================================================= # SS Part 10: Small sample size # ============================================================================= test_that("SS matches individual: small n (Part 10)", { set.seed(11) n <- 30; p <- 50 X <- matrix(rnorm(n * p), n, p) beta <- rep(0, p); beta[1:2] <- c(3, -2) y <- as.vector(X %*% beta + rnorm(n)) res <- run_ss_and_individual_NIG(X, y, list(L = 5)) expect_ss_matches_individual_ss(res) }) # ============================================================================= # SS Part 11: High noise # ============================================================================= test_that("SS matches individual: high noise (Part 11)", { set.seed(12) n <- 100; p <- 50 X <- matrix(rnorm(n * p), n, p) beta <- rep(0, p); beta[1:4] <- c(2, 3, -2, 1.5) y <- as.vector(X %*% beta + rnorm(n, sd = 10)) res <- run_ss_and_individual_NIG(X, y, list(L = 10)) expect_ss_matches_individual_ss(res) }) # ============================================================================= # SS Part 12: Custom alpha0/beta0 with standardize=FALSE # ============================================================================= test_that("SS matches individual: custom priors + standardize=FALSE (Part 12)", { set.seed(14) n <- 100; p <- 50 X <- matrix(rnorm(n * p), n, p) beta <- rep(0, p); beta[1:4] <- c(2, 3, -2, 1.5) y <- as.vector(X %*% beta + rnorm(n)) res <- run_ss_and_individual_NIG(X, y, 
list(L = 10, standardize = FALSE, alpha0 = 0.5, beta0 = 0.5)) expect_ss_matches_individual_ss(res) }) # ============================================================================= # SS Part 13: Null signal # ============================================================================= test_that("SS matches individual: null signal (Part 13)", { set.seed(15) n <- 100; p <- 50 X <- matrix(rnorm(n * p), n, p) y <- rnorm(n) res <- run_ss_and_individual_NIG(X, y, list(L = 5)) expect_ss_matches_individual_ss(res) }) # ============================================================================= # SS Part 14: L=1 with standardize=FALSE (skipped) # ============================================================================= test_that("SS matches individual: L=1, standardize=FALSE (Part 14)", { skip("L=1 uses different convergence methods between dev and ref") set.seed(16) n <- 100; p <- 50 X <- matrix(rnorm(n * p), n, p) beta <- rep(0, p); beta[5] <- 4 y <- as.vector(X %*% beta + rnorm(n)) res <- run_ss_and_individual_NIG(X, y, list(L = 1, standardize = FALSE)) expect_ss_matches_individual_ss(res) }) # ============================================================================= # SS Part 15: n >> p (overdetermined) # ============================================================================= test_that("SS matches individual: n >> p (Part 15)", { set.seed(101) n <- 500; p <- 20 X <- matrix(rnorm(n * p), n, p) beta <- rep(0, p); beta[1:3] <- c(2, -1.5, 3) y <- as.vector(X %*% beta + rnorm(n)) res <- run_ss_and_individual_NIG(X, y, list(L = 5)) expect_ss_matches_individual_ss(res) }) # ============================================================================= # SS Part 16: n << p (underdetermined) # ============================================================================= test_that("SS matches individual: n << p (Part 16)", { set.seed(102) n <- 30; p <- 200 X <- matrix(rnorm(n * p), n, p) beta <- rep(0, p); beta[c(5, 50)] <- c(3, -2) y <- as.vector(X %*% beta + 
rnorm(n)) res <- run_ss_and_individual_NIG(X, y, list(L = 5)) expect_ss_matches_individual_ss(res) }) # ============================================================================= # SS Part 17: n = p (square) # ============================================================================= test_that("SS matches individual: n = p (Part 17)", { set.seed(103) n <- 50; p <- 50 X <- matrix(rnorm(n * p), n, p) beta <- rep(0, p); beta[1:3] <- c(2, -2, 1.5) y <- as.vector(X %*% beta + rnorm(n)) res <- run_ss_and_individual_NIG(X, y, list(L = 5)) expect_ss_matches_individual_ss(res) }) # ============================================================================= # SS Part 18: Very small n # ============================================================================= test_that("SS matches individual: very small n (Part 18)", { set.seed(104) n <- 10; p <- 30 X <- matrix(rnorm(n * p), n, p) beta <- rep(0, p); beta[1] <- 3 y <- as.vector(X %*% beta + rnorm(n)) res <- run_ss_and_individual_NIG(X, y, list(L = 3)) expect_ss_matches_individual_ss(res) }) # ============================================================================= # SS Part 19: Weak signals # ============================================================================= test_that("SS matches individual: weak signals (Part 19)", { set.seed(105) n <- 100; p <- 50 X <- matrix(rnorm(n * p), n, p) beta <- rep(0, p); beta[1:3] <- c(0.3, -0.3, 0.2) y <- as.vector(X %*% beta + rnorm(n)) res <- run_ss_and_individual_NIG(X, y, list(L = 5)) expect_ss_matches_individual_ss(res) }) # ============================================================================= # SS Part 20: Very strong signals # ============================================================================= test_that("SS matches individual: very strong signals (Part 20)", { set.seed(106) n <- 100; p <- 50 X <- matrix(rnorm(n * p), n, p) beta <- rep(0, p); beta[1:3] <- c(10, -15, 20) y <- as.vector(X %*% beta + rnorm(n)) res <- run_ss_and_individual_NIG(X, y, 
list(L = 5)) expect_ss_matches_individual_ss(res) }) # ============================================================================= # SS Part 21: Mixed strength signals # ============================================================================= test_that("SS matches individual: mixed strength signals (Part 21)", { set.seed(107) n <- 100; p <- 50 X <- matrix(rnorm(n * p), n, p) beta <- rep(0, p); beta[1:4] <- c(10, 0.5, -10, 0.3) y <- as.vector(X %*% beta + rnorm(n)) res <- run_ss_and_individual_NIG(X, y, list(L = 10)) expect_ss_matches_individual_ss(res) }) # ============================================================================= # SS Part 22: Many true effects # ============================================================================= test_that("SS matches individual: many true effects (Part 22)", { set.seed(108) n <- 100; p <- 50 X <- matrix(rnorm(n * p), n, p) beta <- rep(0, p) beta[1:10] <- c(2, -1.5, 3, -2, 1, -1, 2.5, -0.8, 1.2, -1.8) y <- as.vector(X %*% beta + rnorm(n)) res <- run_ss_and_individual_NIG(X, y, list(L = 10)) expect_ss_matches_individual_ss(res) }) # ============================================================================= # SS Part 23: L = 2 # ============================================================================= test_that("SS matches individual: L = 2 (Part 23)", { set.seed(109) n <- 100; p <- 50 X <- matrix(rnorm(n * p), n, p) beta <- rep(0, p); beta[1:2] <- c(3, -2) y <- as.vector(X %*% beta + rnorm(n)) res <- run_ss_and_individual_NIG(X, y, list(L = 2)) expect_ss_matches_individual_ss(res) }) # ============================================================================= # SS Part 24: L = 20 # ============================================================================= test_that("SS matches individual: L = 20 (Part 24)", { set.seed(110) n <- 100; p <- 50 X <- matrix(rnorm(n * p), n, p) beta <- rep(0, p); beta[1:4] <- c(2, 3, -2, 1.5) y <- as.vector(X %*% beta + rnorm(n)) res <- run_ss_and_individual_NIG(X, y, 
list(L = 20)) expect_ss_matches_individual_ss(res) })

# =============================================================================
# SS Part 25: L >> true effects
# =============================================================================
test_that("SS matches individual: L >> true effects (Part 25)", {
  set.seed(111)
  n_obs  <- 100
  n_pred <- 50
  design <- matrix(rnorm(n_obs * n_pred), n_obs, n_pred)
  true_beta <- rep(0, n_pred)
  # Only two real effects, but many more single-effect slots (L = 15).
  true_beta[1:2] <- c(3, -2)
  response <- as.vector(design %*% true_beta + rnorm(n_obs))
  result <- run_ss_and_individual_NIG(design, response, list(L = 15))
  expect_ss_matches_individual_ss(result)
})

# =============================================================================
# SS Part 26: L < true effects
# =============================================================================
test_that("SS matches individual: L < true effects (Part 26)", {
  set.seed(112)
  n_obs  <- 100
  n_pred <- 50
  design <- matrix(rnorm(n_obs * n_pred), n_obs, n_pred)
  true_beta <- rep(0, n_pred)
  # Five real effects but only L = 2 single-effect slots.
  true_beta[1:5] <- c(3, -2, 4, -1.5, 2)
  response <- as.vector(design %*% true_beta + rnorm(n_obs))
  result <- run_ss_and_individual_NIG(design, response, list(L = 2))
  expect_ss_matches_individual_ss(result)
})

# =============================================================================
# SS Part 27: Informative alpha0/beta0
# =============================================================================
test_that("SS matches individual: informative alpha0/beta0 (Part 27)", {
  set.seed(113)
  n_obs  <- 100
  n_pred <- 50
  design <- matrix(rnorm(n_obs * n_pred), n_obs, n_pred)
  true_beta <- rep(0, n_pred)
  true_beta[1:4] <- c(2, 3, -2, 1.5)
  response <- as.vector(design %*% true_beta + rnorm(n_obs))
  # Strongly informative inverse-gamma hyperparameters.
  result <- run_ss_and_individual_NIG(design, response,
                                      list(L = 10, alpha0 = 10, beta0 = 10))
  expect_ss_matches_individual_ss(result)
})

# =============================================================================
# SS Part 28: Very diffuse alpha0/beta0
# =============================================================================
test_that("SS matches individual: very diffuse alpha0/beta0 (Part 28)", { set.seed(114) n <- 100; p <- 50 X <- matrix(rnorm(n * p), n, p) beta <- rep(0, p); beta[1:4] <- c(2, 3, -2, 1.5) y <- as.vector(X %*%
beta + rnorm(n)) res <- run_ss_and_individual_NIG(X, y, list(L = 10, alpha0 = 0.001, beta0 = 0.001)) expect_ss_matches_individual_ss(res) }) # ============================================================================= # SS Part 29: Asymmetric alpha0/beta0 # ============================================================================= test_that("SS matches individual: asymmetric alpha0/beta0 (Part 29)", { set.seed(115) n <- 100; p <- 50 X <- matrix(rnorm(n * p), n, p) beta <- rep(0, p); beta[1:4] <- c(2, 3, -2, 1.5) y <- as.vector(X %*% beta + rnorm(n)) res <- run_ss_and_individual_NIG(X, y, list(L = 10, alpha0 = 0.1, beta0 = 1.0)) expect_ss_matches_individual_ss(res) }) # ============================================================================= # SS Part 30: AR(1) correlated predictors # ============================================================================= test_that("SS matches individual: AR(1) correlated X (Part 30)", { set.seed(116) n <- 100; p <- 50; rho <- 0.8 Z <- matrix(rnorm(n * p), n, p) X <- Z for (j in 2:p) { X[, j] <- rho * X[, j - 1] + sqrt(1 - rho^2) * Z[, j] } beta <- rep(0, p); beta[c(1, 25)] <- c(3, -2) y <- as.vector(X %*% beta + rnorm(n)) res <- run_ss_and_individual_NIG(X, y, list(L = 5)) expect_ss_matches_individual_ss(res) }) # ============================================================================= # SS Part 31: Block-correlated predictors # ============================================================================= test_that("SS matches individual: block-correlated X (Part 31)", { set.seed(117) n <- 100; p <- 50; block_size <- 5 n_blocks <- p / block_size X <- matrix(0, n, p) for (b in seq_len(n_blocks)) { cols <- ((b - 1) * block_size + 1):(b * block_size) common <- rnorm(n) for (j in cols) { X[, j] <- 0.8 * common + 0.6 * rnorm(n) } } beta <- rep(0, p); beta[c(1, 26)] <- c(3, -2) y <- as.vector(X %*% beta + rnorm(n)) res <- run_ss_and_individual_NIG(X, y, list(L = 5)) expect_ss_matches_individual_ss(res) }) # 
=============================================================================
# SS Part 32: Near-collinear predictors
# =============================================================================
test_that("SS matches individual: near-collinear X (Part 32)", {
  set.seed(118)
  n_obs  <- 100
  n_pred <- 50
  design <- matrix(rnorm(n_obs * n_pred), n_obs, n_pred)
  # Make column 2 almost identical to column 1 (tiny independent noise).
  design[, 2] <- design[, 1] + rnorm(n_obs, sd = 0.1)
  true_beta <- rep(0, n_pred)
  true_beta[c(1, 2)] <- c(2, -1.5)
  response <- as.vector(design %*% true_beta + rnorm(n_obs))
  result <- run_ss_and_individual_NIG(design, response, list(L = 5))
  expect_ss_matches_individual_ss(result)
})

# =============================================================================
# SS Part 33: max_iter = 1
# =============================================================================
test_that("SS matches individual: max_iter = 1 (Part 33)", {
  set.seed(119)
  n_obs  <- 100
  n_pred <- 50
  design <- matrix(rnorm(n_obs * n_pred), n_obs, n_pred)
  true_beta <- rep(0, n_pred)
  true_beta[1:4] <- c(2, 3, -2, 1.5)
  response <- as.vector(design %*% true_beta + rnorm(n_obs))
  # A single coordinate-ascent pass: both code paths must agree even
  # far from convergence.
  result <- run_ss_and_individual_NIG(design, response,
                                      list(L = 10, max_iter = 1))
  expect_ss_matches_individual_ss(result)
})

# =============================================================================
# SS Part 34: max_iter = 2
# =============================================================================
test_that("SS matches individual: max_iter = 2 (Part 34)", {
  set.seed(120)
  n_obs  <- 100
  n_pred <- 50
  design <- matrix(rnorm(n_obs * n_pred), n_obs, n_pred)
  true_beta <- rep(0, n_pred)
  true_beta[1:4] <- c(2, 3, -2, 1.5)
  response <- as.vector(design %*% true_beta + rnorm(n_obs))
  result <- run_ss_and_individual_NIG(design, response,
                                      list(L = 10, max_iter = 2))
  expect_ss_matches_individual_ss(result)
})

# =============================================================================
# SS Part 35: Tight convergence tolerance
# =============================================================================
test_that("SS matches individual: tight tol = 1e-6 (Part 35)", { set.seed(121) n <- 100; p <- 50 X <- matrix(rnorm(n * p), n, p) beta <- rep(0, p); beta[1:4] <- c(2, 3, -2, 1.5) y <- as.vector(X %*% beta + rnorm(n)) res <-
run_ss_and_individual_NIG(X, y, list(L = 10, tol = 1e-6)) expect_ss_matches_individual_ss(res) }) # ============================================================================= # SS Part 36: null_weight = 0.5 (skipped — known dev-side bug) # ============================================================================= test_that("SS matches individual: null_weight = 0.5 (Part 36)", { skip("null_weight + NIG triggers NA in loglik (dev-side bug)") set.seed(122) n <- 100; p <- 50 X <- matrix(rnorm(n * p), n, p) beta <- rep(0, p); beta[1:4] <- c(2, 3, -2, 1.5) y <- as.vector(X %*% beta + rnorm(n)) res <- run_ss_and_individual_NIG(X, y, list(L = 10, null_weight = 0.5)) expect_ss_matches_individual_ss(res) }) # ============================================================================= # SS Part 37: Non-uniform prior_weights # ============================================================================= test_that("SS matches individual: non-uniform prior_weights (Part 37)", { set.seed(123) n <- 100; p <- 50 X <- matrix(rnorm(n * p), n, p) beta <- rep(0, p); beta[1:4] <- c(2, 3, -2, 1.5) y <- as.vector(X %*% beta + rnorm(n)) pw <- rep(1, p); pw[1:10] <- 5; pw <- pw / sum(pw) res <- run_ss_and_individual_NIG(X, y, list(L = 10, prior_weights = pw)) expect_ss_matches_individual_ss(res) }) # ============================================================================= # SS Part 38: Small n + weak signal # ============================================================================= test_that("SS matches individual: small n + weak signal (Part 38)", { set.seed(124) n <- 20; p <- 50 X <- matrix(rnorm(n * p), n, p) beta <- rep(0, p); beta[1:2] <- c(0.5, -0.3) y <- as.vector(X %*% beta + rnorm(n)) res <- run_ss_and_individual_NIG(X, y, list(L = 5)) expect_ss_matches_individual_ss(res) }) # ============================================================================= # SS Part 39: n << p + L large # ============================================================================= 
test_that("SS matches individual: n << p + large L (Part 39)", { set.seed(125) n <- 30; p <- 200 X <- matrix(rnorm(n * p), n, p) beta <- rep(0, p); beta[c(10, 50, 100)] <- c(3, -2, 4) y <- as.vector(X %*% beta + rnorm(n)) res <- run_ss_and_individual_NIG(X, y, list(L = 10)) expect_ss_matches_individual_ss(res) }) # ============================================================================= # SS Part 40: standardize=FALSE + custom alpha0/beta0 # ============================================================================= test_that("SS matches individual: standardize=FALSE + custom priors (Part 40)", { set.seed(127) n <- 100; p <- 50 X <- matrix(rnorm(n * p), n, p) beta <- rep(0, p); beta[1:4] <- c(2, 3, -2, 1.5) y <- as.vector(X %*% beta + rnorm(n)) res <- run_ss_and_individual_NIG(X, y, list(L = 10, standardize = FALSE, alpha0 = 1.0, beta0 = 0.5)) expect_ss_matches_individual_ss(res) }) # ============================================================================= # SS Part 41-43: L = 1 variants (all skipped) # ============================================================================= test_that("SS matches individual: L=1 + high noise (Part 41)", { skip("L=1 uses different convergence methods between dev and ref") set.seed(129) n <- 100; p <- 50 X <- matrix(rnorm(n * p), n, p) beta <- rep(0, p); beta[1] <- 3 y <- as.vector(X %*% beta + rnorm(n, sd = 10)) res <- run_ss_and_individual_NIG(X, y, list(L = 1)) expect_ss_matches_individual_ss(res) }) test_that("SS matches individual: L=1 + very small n (Part 42)", { skip("L=1 uses different convergence methods between dev and ref") set.seed(130) n <- 15; p <- 30 X <- matrix(rnorm(n * p), n, p) beta <- rep(0, p); beta[1] <- 4 y <- as.vector(X %*% beta + rnorm(n)) res <- run_ss_and_individual_NIG(X, y, list(L = 1)) expect_ss_matches_individual_ss(res) }) test_that("SS matches individual: L=1 + null signal (Part 43)", { skip("L=1 uses different convergence methods between dev and ref") set.seed(131) n <- 100; p <- 50 
X <- matrix(rnorm(n * p), n, p) y <- rnorm(n) res <- run_ss_and_individual_NIG(X, y, list(L = 1)) expect_ss_matches_individual_ss(res) }) # ############################################################################# # RSS (SUMMARY STATISTICS) VS INDIVIDUAL-LEVEL DATA COMPARISON # ############################################################################# # # For each reference test scenario above, verify that susie_rss() # (via the bhat/shat/var_y path) produces the same result as susie() # with NIG. # These tests do NOT require the reference package. # ============================================================================= # RSS Part 1: Default parameters (baseline match) # ============================================================================= test_that("RSS matches individual: defaults (Part 1)", { set.seed(1) n <- 100; p <- 50 X <- matrix(rnorm(n * p), n, p) beta <- rep(0, p); beta[1:4] <- c(2, 3, -2, 1.5) y <- as.vector(X %*% beta + rnorm(n)) res <- run_rss_and_individual_NIG(X, y, list(L = 10)) expect_rss_matches_individual_ss(res) }) # ============================================================================= # RSS Part 2: L = 1 (skipped — convergence method differs) # ============================================================================= test_that("RSS matches individual: L = 1 (Part 2)", { skip("L=1 uses different convergence methods between dev and ref") set.seed(2) n <- 100; p <- 50 X <- matrix(rnorm(n * p), n, p) beta <- rep(0, p); beta[3] <- 3 y <- as.vector(X %*% beta + rnorm(n)) res <- run_rss_and_individual_NIG(X, y, list(L = 1)) expect_rss_matches_individual_ss(res) }) # ============================================================================= # RSS Part 3: standardize = FALSE # ============================================================================= test_that("RSS matches individual: standardize=FALSE (Part 3)", { set.seed(3) n <- 100; p <- 50 X <- matrix(rnorm(n * p), n, p) beta <- rep(0, p); beta[1:4] <- c(2, 
3, -2, 1.5) y <- as.vector(X %*% beta + rnorm(n)) res <- run_rss_and_individual_NIG(X, y, list(L = 10, standardize = FALSE)) expect_rss_matches_individual_ss(res) })

# =============================================================================
# RSS Part 4: Custom alpha0 and beta0
# =============================================================================
test_that("RSS matches individual: custom alpha0/beta0 (Part 4)", {
  set.seed(5)
  n_obs  <- 100
  n_pred <- 50
  design <- matrix(rnorm(n_obs * n_pred), n_obs, n_pred)
  true_beta <- rep(0, n_pred)
  true_beta[1:4] <- c(2, 3, -2, 1.5)
  response <- as.vector(design %*% true_beta + rnorm(n_obs))
  result <- run_rss_and_individual_NIG(design, response,
                                       list(L = 10, alpha0 = 1.0, beta0 = 1.0))
  expect_rss_matches_individual_ss(result)
})

test_that("RSS matches individual: small alpha0/beta0 (Part 5)", {
  set.seed(6)
  n_obs  <- 100
  n_pred <- 50
  design <- matrix(rnorm(n_obs * n_pred), n_obs, n_pred)
  true_beta <- rep(0, n_pred)
  true_beta[1:4] <- c(2, 3, -2, 1.5)
  response <- as.vector(design %*% true_beta + rnorm(n_obs))
  # Near-improper (very small) inverse-gamma hyperparameters.
  result <- run_rss_and_individual_NIG(design, response,
                                       list(L = 10, alpha0 = 0.01, beta0 = 0.01))
  expect_rss_matches_individual_ss(result)
})

# =============================================================================
# RSS Part 6: estimate_prior_variance = FALSE
# =============================================================================
test_that("RSS matches individual: estimate_prior_variance=FALSE (Part 6)", {
  set.seed(7)
  n_obs  <- 100
  n_pred <- 50
  design <- matrix(rnorm(n_obs * n_pred), n_obs, n_pred)
  true_beta <- rep(0, n_pred)
  true_beta[1:4] <- c(2, 3, -2, 1.5)
  response <- as.vector(design %*% true_beta + rnorm(n_obs))
  result <- run_rss_and_individual_NIG(design, response,
                                       list(L = 10,
                                            estimate_prior_variance = FALSE))
  expect_rss_matches_individual_ss(result)
})

# =============================================================================
# RSS Part 7: Explicit convergence tolerance
# =============================================================================
test_that("RSS matches individual: tol = 1e-4 (Part 7)", { set.seed(8) n <- 100; p <- 50 X <- matrix(rnorm(n * p), n, p) beta <- rep(0, p); beta[1:4] <- c(2, 3, -2, 1.5) y <- as.vector(X %*%
beta + rnorm(n)) res <- run_rss_and_individual_NIG(X, y, list(L = 10, tol = 1e-4)) expect_rss_matches_individual_ss(res) }) # ============================================================================= # RSS Part 8: max_iter boundary # ============================================================================= test_that("RSS matches individual: small max_iter (Part 8)", { set.seed(9) n <- 100; p <- 50 X <- matrix(rnorm(n * p), n, p) beta <- rep(0, p); beta[1:4] <- c(2, 3, -2, 1.5) y <- as.vector(X %*% beta + rnorm(n)) res <- run_rss_and_individual_NIG(X, y, list(L = 10, max_iter = 5)) expect_rss_matches_individual_ss(res) }) # ============================================================================= # RSS Part 9: Sparse signal # ============================================================================= test_that("RSS matches individual: very sparse signal (Part 9)", { set.seed(10) n <- 100; p <- 200 X <- matrix(rnorm(n * p), n, p) beta <- rep(0, p); beta[1] <- 5 y <- as.vector(X %*% beta + rnorm(n)) res <- run_rss_and_individual_NIG(X, y, list(L = 5)) expect_rss_matches_individual_ss(res) }) # ============================================================================= # RSS Part 10: Small sample size # ============================================================================= test_that("RSS matches individual: small n (Part 10)", { set.seed(11) n <- 30; p <- 50 X <- matrix(rnorm(n * p), n, p) beta <- rep(0, p); beta[1:2] <- c(3, -2) y <- as.vector(X %*% beta + rnorm(n)) res <- run_rss_and_individual_NIG(X, y, list(L = 5)) expect_rss_matches_individual_ss(res) }) # ============================================================================= # RSS Part 11: High noise # ============================================================================= test_that("RSS matches individual: high noise (Part 11)", { set.seed(12) n <- 100; p <- 50 X <- matrix(rnorm(n * p), n, p) beta <- rep(0, p); beta[1:4] <- c(2, 3, -2, 1.5) y <- as.vector(X %*% beta + rnorm(n, 
sd = 10)) res <- run_rss_and_individual_NIG(X, y, list(L = 10)) expect_rss_matches_individual_ss(res) })

# =============================================================================
# RSS Part 12: Custom alpha0/beta0 with standardize=FALSE
# =============================================================================
test_that("RSS matches individual: custom priors + standardize=FALSE (Part 12)", {
  set.seed(14)
  n_obs  <- 100
  n_pred <- 50
  design <- matrix(rnorm(n_obs * n_pred), n_obs, n_pred)
  true_beta <- rep(0, n_pred)
  true_beta[1:4] <- c(2, 3, -2, 1.5)
  response <- as.vector(design %*% true_beta + rnorm(n_obs))
  result <- run_rss_and_individual_NIG(design, response,
                                       list(L = 10, standardize = FALSE,
                                            alpha0 = 0.5, beta0 = 0.5))
  expect_rss_matches_individual_ss(result)
})

# =============================================================================
# RSS Part 13: Null signal
# =============================================================================
test_that("RSS matches individual: null signal (Part 13)", {
  set.seed(15)
  n_obs  <- 100
  n_pred <- 50
  design <- matrix(rnorm(n_obs * n_pred), n_obs, n_pred)
  # Response is pure noise: no predictor has a true effect.
  response <- rnorm(n_obs)
  result <- run_rss_and_individual_NIG(design, response, list(L = 5))
  expect_rss_matches_individual_ss(result)
})

# =============================================================================
# RSS Part 14: L=1 with standardize=FALSE (skipped)
# =============================================================================
test_that("RSS matches individual: L=1, standardize=FALSE (Part 14)", {
  skip("L=1 uses different convergence methods between dev and ref")
  set.seed(16)
  n_obs  <- 100
  n_pred <- 50
  design <- matrix(rnorm(n_obs * n_pred), n_obs, n_pred)
  true_beta <- rep(0, n_pred)
  true_beta[5] <- 4
  response <- as.vector(design %*% true_beta + rnorm(n_obs))
  result <- run_rss_and_individual_NIG(design, response,
                                       list(L = 1, standardize = FALSE))
  expect_rss_matches_individual_ss(result)
})

# =============================================================================
# RSS Part 15: n >> p (overdetermined)
# =============================================================================
test_that("RSS matches individual: n >> p (Part 15)", { set.seed(101) n <- 500; p
<- 20 X <- matrix(rnorm(n * p), n, p) beta <- rep(0, p); beta[1:3] <- c(2, -1.5, 3) y <- as.vector(X %*% beta + rnorm(n)) res <- run_rss_and_individual_NIG(X, y, list(L = 5)) expect_rss_matches_individual_ss(res) }) # ============================================================================= # RSS Part 16: n << p (underdetermined) # ============================================================================= test_that("RSS matches individual: n << p (Part 16)", { set.seed(102) n <- 30; p <- 200 X <- matrix(rnorm(n * p), n, p) beta <- rep(0, p); beta[c(5, 50)] <- c(3, -2) y <- as.vector(X %*% beta + rnorm(n)) res <- run_rss_and_individual_NIG(X, y, list(L = 5)) expect_rss_matches_individual_ss(res) }) # ============================================================================= # RSS Part 17: n = p (square) # ============================================================================= test_that("RSS matches individual: n = p (Part 17)", { set.seed(103) n <- 50; p <- 50 X <- matrix(rnorm(n * p), n, p) beta <- rep(0, p); beta[1:3] <- c(2, -2, 1.5) y <- as.vector(X %*% beta + rnorm(n)) res <- run_rss_and_individual_NIG(X, y, list(L = 5)) expect_rss_matches_individual_ss(res) }) # ============================================================================= # RSS Part 18: Very small n # ============================================================================= test_that("RSS matches individual: very small n (Part 18)", { set.seed(104) n <- 10; p <- 30 X <- matrix(rnorm(n * p), n, p) beta <- rep(0, p); beta[1] <- 3 y <- as.vector(X %*% beta + rnorm(n)) res <- run_rss_and_individual_NIG(X, y, list(L = 3)) expect_rss_matches_individual_ss(res) }) # ============================================================================= # RSS Part 19: Weak signals # ============================================================================= test_that("RSS matches individual: weak signals (Part 19)", { set.seed(105) n <- 100; p <- 50 X <- matrix(rnorm(n * p), n, p) beta <- 
rep(0, p); beta[1:3] <- c(0.3, -0.3, 0.2) y <- as.vector(X %*% beta + rnorm(n)) res <- run_rss_and_individual_NIG(X, y, list(L = 5)) expect_rss_matches_individual_ss(res) })

# =============================================================================
# RSS Part 20: Very strong signals
# =============================================================================
test_that("RSS matches individual: very strong signals (Part 20)", {
  set.seed(106)
  n_obs  <- 100
  n_pred <- 50
  design <- matrix(rnorm(n_obs * n_pred), n_obs, n_pred)
  true_beta <- rep(0, n_pred)
  # Effects are huge relative to unit-variance noise.
  true_beta[1:3] <- c(10, -15, 20)
  response <- as.vector(design %*% true_beta + rnorm(n_obs))
  result <- run_rss_and_individual_NIG(design, response, list(L = 5))
  expect_rss_matches_individual_ss(result)
})

# =============================================================================
# RSS Part 21: Mixed strength signals
# =============================================================================
test_that("RSS matches individual: mixed strength signals (Part 21)", {
  set.seed(107)
  n_obs  <- 100
  n_pred <- 50
  design <- matrix(rnorm(n_obs * n_pred), n_obs, n_pred)
  true_beta <- rep(0, n_pred)
  # Two dominant effects interleaved with two weak ones.
  true_beta[1:4] <- c(10, 0.5, -10, 0.3)
  response <- as.vector(design %*% true_beta + rnorm(n_obs))
  result <- run_rss_and_individual_NIG(design, response, list(L = 10))
  expect_rss_matches_individual_ss(result)
})

# =============================================================================
# RSS Part 22: Many true effects
# =============================================================================
test_that("RSS matches individual: many true effects (Part 22)", {
  set.seed(108)
  n_obs  <- 100
  n_pred <- 50
  design <- matrix(rnorm(n_obs * n_pred), n_obs, n_pred)
  true_beta <- rep(0, n_pred)
  true_beta[1:10] <- c(2, -1.5, 3, -2, 1, -1, 2.5, -0.8, 1.2, -1.8)
  response <- as.vector(design %*% true_beta + rnorm(n_obs))
  result <- run_rss_and_individual_NIG(design, response, list(L = 10))
  expect_rss_matches_individual_ss(result)
})

# =============================================================================
# RSS Part 23: L = 2
# =============================================================================
test_that("RSS matches individual: L = 2 (Part 23)", { set.seed(109) n <- 100; p
<- 50 X <- matrix(rnorm(n * p), n, p) beta <- rep(0, p); beta[1:2] <- c(3, -2) y <- as.vector(X %*% beta + rnorm(n)) res <- run_rss_and_individual_NIG(X, y, list(L = 2)) expect_rss_matches_individual_ss(res) }) # ============================================================================= # RSS Part 24: L = 20 # ============================================================================= test_that("RSS matches individual: L = 20 (Part 24)", { set.seed(110) n <- 100; p <- 50 X <- matrix(rnorm(n * p), n, p) beta <- rep(0, p); beta[1:4] <- c(2, 3, -2, 1.5) y <- as.vector(X %*% beta + rnorm(n)) res <- run_rss_and_individual_NIG(X, y, list(L = 20)) expect_rss_matches_individual_ss(res) }) # ============================================================================= # RSS Part 25: L >> true effects # ============================================================================= test_that("RSS matches individual: L >> true effects (Part 25)", { set.seed(111) n <- 100; p <- 50 X <- matrix(rnorm(n * p), n, p) beta <- rep(0, p); beta[1:2] <- c(3, -2) y <- as.vector(X %*% beta + rnorm(n)) res <- run_rss_and_individual_NIG(X, y, list(L = 15)) expect_rss_matches_individual_ss(res) }) # ============================================================================= # RSS Part 26: L < true effects # ============================================================================= test_that("RSS matches individual: L < true effects (Part 26)", { set.seed(112) n <- 100; p <- 50 X <- matrix(rnorm(n * p), n, p) beta <- rep(0, p); beta[1:5] <- c(3, -2, 4, -1.5, 2) y <- as.vector(X %*% beta + rnorm(n)) res <- run_rss_and_individual_NIG(X, y, list(L = 2)) expect_rss_matches_individual_ss(res) }) # ============================================================================= # RSS Part 27: Informative alpha0/beta0 # ============================================================================= test_that("RSS matches individual: informative alpha0/beta0 (Part 27)", { set.seed(113) n <- 100; p 
<- 50 X <- matrix(rnorm(n * p), n, p) beta <- rep(0, p); beta[1:4] <- c(2, 3, -2, 1.5) y <- as.vector(X %*% beta + rnorm(n)) res <- run_rss_and_individual_NIG(X, y, list(L = 10, alpha0 = 10, beta0 = 10)) expect_rss_matches_individual_ss(res) }) # ============================================================================= # RSS Part 28: Very diffuse alpha0/beta0 # ============================================================================= test_that("RSS matches individual: very diffuse alpha0/beta0 (Part 28)", { set.seed(114) n <- 100; p <- 50 X <- matrix(rnorm(n * p), n, p) beta <- rep(0, p); beta[1:4] <- c(2, 3, -2, 1.5) y <- as.vector(X %*% beta + rnorm(n)) res <- run_rss_and_individual_NIG(X, y, list(L = 10, alpha0 = 0.001, beta0 = 0.001)) expect_rss_matches_individual_ss(res) }) # ============================================================================= # RSS Part 29: Asymmetric alpha0/beta0 # ============================================================================= test_that("RSS matches individual: asymmetric alpha0/beta0 (Part 29)", { set.seed(115) n <- 100; p <- 50 X <- matrix(rnorm(n * p), n, p) beta <- rep(0, p); beta[1:4] <- c(2, 3, -2, 1.5) y <- as.vector(X %*% beta + rnorm(n)) res <- run_rss_and_individual_NIG(X, y, list(L = 10, alpha0 = 0.1, beta0 = 1.0)) expect_rss_matches_individual_ss(res) }) # ============================================================================= # RSS Part 30: AR(1) correlated predictors # ============================================================================= test_that("RSS matches individual: AR(1) correlated X (Part 30)", { set.seed(116) n <- 100; p <- 50; rho <- 0.8 Z <- matrix(rnorm(n * p), n, p) X <- Z for (j in 2:p) { X[, j] <- rho * X[, j - 1] + sqrt(1 - rho^2) * Z[, j] } beta <- rep(0, p); beta[c(1, 25)] <- c(3, -2) y <- as.vector(X %*% beta + rnorm(n)) res <- run_rss_and_individual_NIG(X, y, list(L = 5)) expect_rss_matches_individual_ss(res) }) # 
============================================================================= # RSS Part 31: Block-correlated predictors # ============================================================================= test_that("RSS matches individual: block-correlated X (Part 31)", { set.seed(117) n <- 100; p <- 50; block_size <- 5 n_blocks <- p / block_size X <- matrix(0, n, p) for (b in seq_len(n_blocks)) { cols <- ((b - 1) * block_size + 1):(b * block_size) common <- rnorm(n) for (j in cols) { X[, j] <- 0.8 * common + 0.6 * rnorm(n) } } beta <- rep(0, p); beta[c(1, 26)] <- c(3, -2) y <- as.vector(X %*% beta + rnorm(n)) res <- run_rss_and_individual_NIG(X, y, list(L = 5)) expect_rss_matches_individual_ss(res) }) # ============================================================================= # RSS Part 32: Near-collinear predictors # ============================================================================= test_that("RSS matches individual: near-collinear X (Part 32)", { set.seed(118) n <- 100; p <- 50 X <- matrix(rnorm(n * p), n, p) X[, 2] <- X[, 1] + rnorm(n, sd = 0.1) beta <- rep(0, p); beta[c(1, 2)] <- c(2, -1.5) y <- as.vector(X %*% beta + rnorm(n)) res <- run_rss_and_individual_NIG(X, y, list(L = 5)) expect_rss_matches_individual_ss(res) }) # ============================================================================= # RSS Part 33: max_iter = 1 # ============================================================================= test_that("RSS matches individual: max_iter = 1 (Part 33)", { set.seed(119) n <- 100; p <- 50 X <- matrix(rnorm(n * p), n, p) beta <- rep(0, p); beta[1:4] <- c(2, 3, -2, 1.5) y <- as.vector(X %*% beta + rnorm(n)) res <- run_rss_and_individual_NIG(X, y, list(L = 10, max_iter = 1)) expect_rss_matches_individual_ss(res) }) # ============================================================================= # RSS Part 34: max_iter = 2 # ============================================================================= test_that("RSS matches individual: max_iter = 
2 (Part 34)", {
  set.seed(120)
  n <- 100; p <- 50
  X <- matrix(rnorm(n * p), n, p)
  beta <- rep(0, p); beta[1:4] <- c(2, 3, -2, 1.5)
  y <- as.vector(X %*% beta + rnorm(n))
  res <- run_rss_and_individual_NIG(X, y, list(L = 10, max_iter = 2))
  expect_rss_matches_individual_ss(res)
})

# =============================================================================
# RSS Part 35: Tight convergence tolerance
# =============================================================================

test_that("RSS matches individual: tight tol = 1e-6 (Part 35)", {
  set.seed(121)
  n_obs <- 100; n_var <- 50
  geno <- matrix(rnorm(n_obs * n_var), n_obs, n_var)
  eff <- rep(0, n_var); eff[1:4] <- c(2, 3, -2, 1.5)
  pheno <- as.vector(geno %*% eff + rnorm(n_obs))
  # A tight tolerance forces many IBSS iterations; both code paths must agree.
  out <- run_rss_and_individual_NIG(geno, pheno, list(L = 10, tol = 1e-6))
  expect_rss_matches_individual_ss(out)
})

# =============================================================================
# RSS Part 36: null_weight = 0.5 (skipped -- known dev-side bug)
# =============================================================================

test_that("RSS matches individual: null_weight = 0.5 (Part 36)", {
  skip("null_weight + NIG triggers NA in loglik (dev-side bug)")
  set.seed(122)
  n_obs <- 100; n_var <- 50
  geno <- matrix(rnorm(n_obs * n_var), n_obs, n_var)
  eff <- rep(0, n_var); eff[1:4] <- c(2, 3, -2, 1.5)
  pheno <- as.vector(geno %*% eff + rnorm(n_obs))
  out <- run_rss_and_individual_NIG(geno, pheno, list(L = 10, null_weight = 0.5))
  expect_rss_matches_individual_ss(out)
})

# =============================================================================
# RSS Part 37: Non-uniform prior_weights
# =============================================================================

test_that("RSS matches individual: non-uniform prior_weights (Part 37)", {
  set.seed(123)
  n_obs <- 100; n_var <- 50
  geno <- matrix(rnorm(n_obs * n_var), n_obs, n_var)
  eff <- rep(0, n_var); eff[1:4] <- c(2, 3, -2, 1.5)
  pheno <- as.vector(geno %*% eff + rnorm(n_obs))
  # Up-weight the first 10 variables 5x, then renormalize to sum to 1.
  wts <- rep(1, n_var)
  wts[1:10] <- 5
  wts <- wts / sum(wts)
  out <- run_rss_and_individual_NIG(geno, pheno, list(L = 10, prior_weights = wts))
  expect_rss_matches_individual_ss(out)
})

# =============================================================================
# RSS Part 38: Small n + weak signal
# =============================================================================

test_that("RSS matches individual: small n + weak signal (Part 38)", {
  set.seed(124)
  n_obs <- 20; n_var <- 50
  geno <- matrix(rnorm(n_obs * n_var), n_obs, n_var)
  eff <- rep(0, n_var); eff[1:2] <- c(0.5, -0.3)
  pheno <- as.vector(geno %*% eff + rnorm(n_obs))
  out <- run_rss_and_individual_NIG(geno, pheno, list(L = 5))
  expect_rss_matches_individual_ss(out)
})

# =============================================================================
# RSS Part 39: n << p + L large
# =============================================================================

test_that("RSS matches individual: n << p + large L (Part 39)", {
  set.seed(125)
  n_obs <- 30; n_var <- 200
  geno <- matrix(rnorm(n_obs * n_var), n_obs, n_var)
  eff <- rep(0, n_var); eff[c(10, 50, 100)] <- c(3, -2, 4)
  pheno <- as.vector(geno %*% eff + rnorm(n_obs))
  out <- run_rss_and_individual_NIG(geno, pheno, list(L = 10))
  expect_rss_matches_individual_ss(out)
})

# =============================================================================
# RSS Part 40: standardize=FALSE + custom alpha0/beta0
# =============================================================================

test_that("RSS matches individual: standardize=FALSE + custom priors (Part 40)", {
  set.seed(127)
  n_obs <- 100; n_var <- 50
  geno <- matrix(rnorm(n_obs * n_var), n_obs, n_var)
  eff <- rep(0, n_var); eff[1:4] <- c(2, 3, -2, 1.5)
  pheno <- as.vector(geno %*% eff + rnorm(n_obs))
  out <- run_rss_and_individual_NIG(geno, pheno,
                                    list(L = 10, standardize = FALSE,
                                         alpha0 = 1.0, beta0 = 0.5))
  expect_rss_matches_individual_ss(out)
})

# =============================================================================
# RSS Part 41-43: L = 1 variants (all skipped)
# =============================================================================

test_that("RSS matches individual: L=1 + high noise (Part 41)", {
  skip("L=1 uses different convergence methods between dev and ref")
  set.seed(129)
  n_obs <- 100; n_var <- 50
  geno <- matrix(rnorm(n_obs * n_var), n_obs, n_var)
  eff <- rep(0, n_var); eff[1] <- 3
  pheno <- as.vector(geno %*% eff + rnorm(n_obs, sd = 10))
  out <- run_rss_and_individual_NIG(geno, pheno, list(L = 1))
  expect_rss_matches_individual_ss(out)
})

test_that("RSS matches individual: L=1 + very small n (Part 42)", {
  skip("L=1 uses different convergence methods between dev and ref")
  set.seed(130)
  n_obs <- 15; n_var <- 30
  geno <- matrix(rnorm(n_obs * n_var), n_obs, n_var)
  eff <- rep(0, n_var); eff[1] <- 4
  pheno <- as.vector(geno %*% eff + rnorm(n_obs))
  out <- run_rss_and_individual_NIG(geno, pheno, list(L = 1))
  expect_rss_matches_individual_ss(out)
})

test_that("RSS matches individual: L=1 + null signal (Part 43)", {
  skip("L=1 uses different convergence methods between dev and ref")
  set.seed(131)
  n_obs <- 100; n_var <- 50
  geno <- matrix(rnorm(n_obs * n_var), n_obs, n_var)
  # Pure-noise response: no true effects at all.
  pheno <- rnorm(n_obs)
  out <- run_rss_and_individual_NIG(geno, pheno, list(L = 1))
  expect_rss_matches_individual_ss(out)
})



================================================
FILE: tests/testthat/reference/test_susie_reference.R
================================================
# Source helper functions
source(file.path("..", "helper_reference.R"), local = TRUE)

context("susie reference comparison")

# =============================================================================
# REFERENCE TESTS FOR susie()
# =============================================================================
#
# These tests compare the new susieR implementation against the reference
# package (stephenslab/susieR@1f9166c) to ensure results are identical.
#
# Tests cover all major parameters and their combinations with all three
# prior variance optimization methods: "optim", "EM", "simple"
# =============================================================================

# =============================================================================
# Part 1: Basic Parameter Tests
# =============================================================================

test_that("susie() matches reference with default parameters - optim", {
  skip_if_no_reference()
  set.seed(1)
  n <- 100; p <- 50
  X <- matrix(rnorm(n * p), n, p)
  b <- rep(0, p); b[1:4] <- c(2, 3, -2, 1.5)
  y <- as.vector(X %*% b + rnorm(n))
  compare_to_reference("susie",
                       list(X = X, y = y, L = 10, estimate_prior_method = "optim"),
                       tolerance = 1e-5)
})

test_that("susie() matches reference with default parameters - EM", {
  skip_if_no_reference()
  set.seed(1)
  n <- 100; p <- 50
  X <- matrix(rnorm(n * p), n, p)
  b <- rep(0, p); b[1:4] <- c(2, 3, -2, 1.5)
  y <- as.vector(X %*% b + rnorm(n))
  compare_to_reference("susie",
                       list(X = X, y = y, L = 10, estimate_prior_method = "EM"),
                       tolerance = 1e-5)
})

test_that("susie() matches reference with default parameters - simple", {
  skip_if_no_reference()
  set.seed(1)
  n <- 100; p <- 50
  X <- matrix(rnorm(n * p), n, p)
  b <- rep(0, p); b[1:4] <- c(2, 3, -2, 1.5)
  y <- as.vector(X %*% b + rnorm(n))
  compare_to_reference("susie",
                       list(X = X, y = y, L = 10, estimate_prior_method = "simple"),
                       tolerance = 1e-5)
})

# =============================================================================
# Part 2: standardize parameter
# =============================================================================

test_that("susie() matches reference with standardize=FALSE - optim", {
  skip_if_no_reference()
  set.seed(2)
  n <- 100; p <- 50
  X <- matrix(rnorm(n * p), n, p)
  b <- rep(0, p); b[1:4] <- c(2, 3, -2, 1.5)
  y <- as.vector(X %*% b + rnorm(n))
  compare_to_reference("susie",
                       list(X = X, y = y, L = 10, standardize = FALSE,
                            estimate_prior_method = "optim"),
                       tolerance = 1e-5)
})

test_that("susie() matches reference with standardize=FALSE - EM", {
  skip_if_no_reference()
  set.seed(2)
  n <- 100; p <- 50
  X <- matrix(rnorm(n * p), n, p)
  b <- rep(0, p); b[1:4] <- c(2, 3, -2, 1.5)
  y <- as.vector(X %*% b + rnorm(n))
  compare_to_reference("susie",
                       list(X = X, y = y, L = 10, standardize = FALSE,
                            estimate_prior_method = "EM"),
                       tolerance = 1e-5)
})

test_that("susie() matches reference with standardize=FALSE - simple", {
  skip_if_no_reference()
  set.seed(2)
  n <- 100; p <- 50
  X <- matrix(rnorm(n * p), n, p)
  b <- rep(0, p); b[1:4] <- c(2, 3, -2, 1.5)
  y <- as.vector(X %*% b + rnorm(n))
  compare_to_reference("susie",
                       list(X = X, y = y, L = 10, standardize = FALSE,
                            estimate_prior_method = "simple"),
                       tolerance = 1e-5)
})

# =============================================================================
# Part 3: intercept parameter
# =============================================================================

test_that("susie() matches reference with intercept=FALSE - optim", {
  skip_if_no_reference()
  set.seed(3)
  n <- 100; p <- 50
  X <- matrix(rnorm(n * p), n, p)
  b <- rep(0, p); b[1:4] <- c(2, 3, -2, 1.5)
  y <- as.vector(X %*% b + rnorm(n))
  compare_to_reference("susie",
                       list(X = X, y = y, L = 10, intercept = FALSE,
                            estimate_prior_method = "optim"),
                       tolerance = 1e-5)
})

test_that("susie() matches reference with intercept=FALSE - EM", {
  skip_if_no_reference()
  set.seed(3)
  n <- 100; p <- 50
  X <- matrix(rnorm(n * p), n, p)
  b <- rep(0, p); b[1:4] <- c(2, 3, -2, 1.5)
  y <- as.vector(X %*% b + rnorm(n))
  compare_to_reference("susie",
                       list(X = X, y = y, L = 10, intercept = FALSE,
                            estimate_prior_method = "EM"),
                       tolerance = 1e-5)
})

test_that("susie() matches reference with intercept=FALSE - simple", {
  skip_if_no_reference()
  set.seed(3)
  n <- 100; p <- 50
  X <- matrix(rnorm(n * p), n, p)
  b <- rep(0, p); b[1:4] <- c(2, 3, -2, 1.5)
  y <- as.vector(X %*% b + rnorm(n))
  compare_to_reference("susie",
                       list(X = X, y = y, L = 10, intercept = FALSE,
                            estimate_prior_method = "simple"),
                       tolerance = 1e-5)
})

# =============================================================================
# Part 4: estimate_prior_variance=FALSE
# =============================================================================

test_that("susie() matches reference with estimate_prior_variance=FALSE", {
  skip_if_no_reference()
  set.seed(4)
  n <- 100; p <- 50
  X <- matrix(rnorm(n * p), n, p)
  b <- rep(0, p); b[1:4] <- c(2, 3, -2, 1.5)
  y <- as.vector(X %*% b + rnorm(n))
  # With estimate_prior_variance = FALSE, the optimization method is irrelevant,
  # so a single test covers all three.
  compare_to_reference("susie",
                       list(X = X, y = y, L = 10, estimate_prior_variance = FALSE),
                       tolerance = 1e-5)
})

# =============================================================================
# Part 5: estimate_residual_variance parameter
# =============================================================================

test_that("susie() matches reference with estimate_residual_variance=FALSE - optim", {
  skip_if_no_reference()
  set.seed(5)
  n <- 100; p <- 50
  X <- matrix(rnorm(n * p), n, p)
  b <- rep(0, p); b[1:4] <- c(2, 3, -2, 1.5)
  y <- as.vector(X %*% b + rnorm(n))
  compare_to_reference("susie",
                       list(X = X, y = y, L = 10,
                            estimate_residual_variance = FALSE,
                            residual_variance = 1.0,
                            estimate_prior_method = "optim"),
                       tolerance = 1e-5)
})

test_that("susie() matches reference with estimate_residual_variance=FALSE - EM", {
  skip_if_no_reference()
  set.seed(5)
  n <- 100; p <- 50
  X <- matrix(rnorm(n * p), n, p)
  b <- rep(0, p); b[1:4] <- c(2, 3, -2, 1.5)
  y <- as.vector(X %*% b + rnorm(n))
  compare_to_reference("susie",
                       list(X = X, y = y, L = 10,
                            estimate_residual_variance = FALSE,
                            residual_variance = 1.0,
                            estimate_prior_method = "EM"),
                       tolerance = 1e-5)
})

test_that("susie() matches reference with estimate_residual_variance=FALSE - simple", {
  skip_if_no_reference()
  set.seed(5)
  n <- 100; p <- 50
  X <- matrix(rnorm(n * p), n, p)
  b <- rep(0, p); b[1:4] <- c(2, 3, -2, 1.5)
  y <- as.vector(X %*% b + rnorm(n))
  compare_to_reference("susie",
                       list(X = X, y = y, L = 10,
                            estimate_residual_variance = FALSE,
                            residual_variance = 1.0,
                            estimate_prior_method = "simple"),
                       tolerance = 1e-5)
})

# =============================================================================
# Part 6: Sparse matrix input
# =============================================================================

test_that("susie() matches reference with sparse matrix input - optim", {
  skip_if_no_reference()
  set.seed(6)
  n <- 100; p <- 50
  X <- matrix(rnorm(n * p), n, p)
  Xsp <- Matrix::Matrix(X, sparse = TRUE)
  b <- rep(0, p); b[1:4] <- c(2, 3, -2, 1.5)
  y <- as.vector(X %*% b + rnorm(n))
  compare_to_reference("susie",
                       list(X = Xsp, y = y, L = 10, estimate_prior_method = "optim"),
                       tolerance = 1e-5)
})

test_that("susie() matches reference with sparse matrix input - EM", {
  skip_if_no_reference()
  set.seed(6)
  n <- 100; p <- 50
  X <- matrix(rnorm(n * p), n, p)
  Xsp <- Matrix::Matrix(X, sparse = TRUE)
  b <- rep(0, p); b[1:4] <- c(2, 3, -2, 1.5)
  y <- as.vector(X %*% b + rnorm(n))
  compare_to_reference("susie",
                       list(X = Xsp, y = y, L = 10, estimate_prior_method = "EM"),
                       tolerance = 1e-5)
})

test_that("susie() matches reference with sparse matrix input - simple", {
  skip_if_no_reference()
  set.seed(6)
  n <- 100; p <- 50
  X <- matrix(rnorm(n * p), n, p)
  Xsp <- Matrix::Matrix(X, sparse = TRUE)
  b <- rep(0, p); b[1:4] <- c(2, 3, -2, 1.5)
  y <- as.vector(X %*% b + rnorm(n))
  compare_to_reference("susie",
                       list(X = Xsp, y = y, L = 10, estimate_prior_method = "simple"),
                       tolerance = 1e-5)
})

# =============================================================================
# Part 7: Different L values
# =============================================================================

test_that("susie() matches reference with different L values - optim", {
  skip_if_no_reference()
  set.seed(7)
  n <- 100; p <- 50
  X <- matrix(rnorm(n * p), n, p)
  b <- rep(0, p); b[1:4] <- c(2, 3, -2, 1.5)
  y <- as.vector(X %*% b + rnorm(n))
  # Cover a single effect, a moderate L, and L well above the true sparsity.
  for (L in c(1, 5, 20))
    compare_to_reference("susie",
                         list(X = X, y = y, L = L, estimate_prior_method = "optim"),
                         tolerance = 1e-5)
})

test_that("susie() matches reference with different L values - EM", {
  skip_if_no_reference()
  set.seed(7)
  n <- 100; p <- 50
  X <- matrix(rnorm(n * p), n, p)
  b <- rep(0, p); b[1:4] <- c(2, 3, -2, 1.5)
  y <- as.vector(X %*% b + rnorm(n))
  for (L in c(1, 5, 20))
    compare_to_reference("susie",
                         list(X = X, y = y, L = L, estimate_prior_method = "EM"),
                         tolerance = 1e-5)
})

test_that("susie() matches reference with different L values - simple", {
  skip_if_no_reference()
  set.seed(7)
  n <- 100; p <- 50
  X <- matrix(rnorm(n * p), n, p)
  b <- rep(0, p); b[1:4] <- c(2, 3, -2, 1.5)
  y <- as.vector(X %*% b + rnorm(n))
  for (L in c(1, 5, 20))
    compare_to_reference("susie",
                         list(X = X, y = y, L = L, estimate_prior_method = "simple"),
                         tolerance = 1e-5)
})

# =============================================================================
# Part 8: prior_weights
# =============================================================================

test_that("susie() matches reference with prior_weights - optim", {
  skip_if_no_reference()
  set.seed(8)
  n <- 100; p <- 50
  X <- matrix(rnorm(n * p), n, p)
  b <- rep(0, p); b[1:4] <- c(2, 3, -2, 1.5)
  y <- as.vector(X %*% b + rnorm(n))
  # Random non-uniform prior weights, normalized to sum to 1.
  w <- runif(p)
  w <- w / sum(w)
  compare_to_reference("susie",
                       list(X = X, y = y, L = 10, prior_weights = w,
                            estimate_prior_method = "optim"),
                       tolerance = 1e-5)
})

test_that("susie() matches reference with prior_weights - EM", {
  skip_if_no_reference()
  set.seed(8)
  n <- 100; p <- 50
  X <- matrix(rnorm(n * p), n, p)
  b <- rep(0, p); b[1:4] <- c(2, 3, -2, 1.5)
  y <- as.vector(X %*% b + rnorm(n))
  w <- runif(p)
  w <- w / sum(w)
  compare_to_reference("susie",
                       list(X = X, y = y, L = 10, prior_weights = w,
                            estimate_prior_method = "EM"),
                       tolerance = 1e-5)
})

test_that("susie() matches reference with prior_weights - simple", {
  skip_if_no_reference()
  set.seed(8)
  n <- 100; p <- 50
  X <- matrix(rnorm(n * p), n, p)
  b <- rep(0, p); b[1:4] <- c(2, 3, -2, 1.5)
  y <- as.vector(X %*% b + rnorm(n))
  w <- runif(p)
  w <- w / sum(w)
  compare_to_reference("susie",
                       list(X = X, y = y, L = 10, prior_weights = w,
                            estimate_prior_method = "simple"),
                       tolerance = 1e-5)
})

# =============================================================================
# Part 9: scaled_prior_variance
# =============================================================================

test_that("susie() matches reference with scaled_prior_variance - optim", {
  skip_if_no_reference()
  set.seed(9)
  n <- 100; p <- 50
  X <- matrix(rnorm(n * p), n, p)
  b <- rep(0, p); b[1:4] <- c(2, 3, -2, 1.5)
  y <- as.vector(X %*% b + rnorm(n))
  compare_to_reference("susie",
                       list(X = X, y = y, L = 10, scaled_prior_variance = 0.5,
                            estimate_prior_method = "optim"),
                       tolerance = 1e-5)
})

test_that("susie() matches reference with scaled_prior_variance - EM", {
  skip_if_no_reference()
  set.seed(9)
  n <- 100; p <- 50
  X <- matrix(rnorm(n * p), n, p)
  b <- rep(0, p); b[1:4] <- c(2, 3, -2, 1.5)
  y <- as.vector(X %*% b + rnorm(n))
  compare_to_reference("susie",
                       list(X = X, y = y, L = 10, scaled_prior_variance = 0.5,
                            estimate_prior_method = "EM"),
                       tolerance = 1e-5)
})

test_that("susie() matches reference with scaled_prior_variance - simple", {
  skip_if_no_reference()
  set.seed(9)
  n <- 100; p <- 50
  X <- matrix(rnorm(n * p), n, p)
  b <- rep(0, p); b[1:4] <- c(2, 3, -2, 1.5)
  y <- as.vector(X %*% b + rnorm(n))
  compare_to_reference("susie",
                       list(X = X, y = y, L = 10, scaled_prior_variance = 0.5,
                            estimate_prior_method = "simple"),
                       tolerance = 1e-5)
})

# =============================================================================
# Part 10: coverage and min_abs_corr
# =============================================================================

test_that("susie() matches reference with coverage=0.99 - optim", {
  skip_if_no_reference()
  set.seed(10)
  n <- 100; p <- 50
  X <- matrix(rnorm(n * p), n, p)
  b <- rep(0, p); b[1:4] <- c(2, 3, -2, 1.5)
  y <- as.vector(X %*% b + rnorm(n))
  compare_to_reference("susie",
                       list(X = X, y = y, L = 10, coverage = 0.99,
                            estimate_prior_method = "optim"),
                       tolerance = 1e-5)
})

test_that("susie() matches reference with coverage=0.99 - EM", {
  skip_if_no_reference()
  set.seed(10)
  n <- 100; p <- 50
  X <- matrix(rnorm(n * p), n, p)
  b <- rep(0, p); b[1:4] <- c(2, 3, -2, 1.5)
  y <- as.vector(X %*% b + rnorm(n))
  compare_to_reference("susie",
                       list(X = X, y = y, L = 10, coverage = 0.99,
                            estimate_prior_method = "EM"),
                       tolerance = 1e-5)
})

test_that("susie() matches reference with coverage=0.99 - simple", {
  skip_if_no_reference()
  set.seed(10)
  n <- 100; p <- 50
  X <- matrix(rnorm(n * p), n, p)
  b <- rep(0, p); b[1:4] <- c(2, 3, -2, 1.5)
  y <- as.vector(X %*% b + rnorm(n))
  compare_to_reference("susie",
                       list(X = X, y = y, L = 10, coverage = 0.99,
                            estimate_prior_method = "simple"),
                       tolerance = 1e-5)
})

test_that("susie() matches reference with min_abs_corr=0.7 - optim", {
  skip_if_no_reference()
  set.seed(11)
  n <- 100; p <- 50
  X <- matrix(rnorm(n * p), n, p)
  b <- rep(0, p); b[1:4] <- c(2, 3, -2, 1.5)
  y <- as.vector(X %*% b + rnorm(n))
  compare_to_reference("susie",
                       list(X = X, y = y, L = 10, min_abs_corr = 0.7,
                            estimate_prior_method = "optim"),
                       tolerance = 1e-5)
})

test_that("susie() matches reference with min_abs_corr=0.7 - EM", {
  skip_if_no_reference()
  set.seed(11)
  n <- 100; p <- 50
  X <- matrix(rnorm(n * p), n, p)
  b <- rep(0, p); b[1:4] <- c(2, 3, -2, 1.5)
  y <- as.vector(X %*% b + rnorm(n))
  compare_to_reference("susie",
                       list(X = X, y = y, L = 10, min_abs_corr = 0.7,
                            estimate_prior_method = "EM"),
                       tolerance = 1e-5)
})

test_that("susie() matches reference with min_abs_corr=0.7 - simple", {
  skip_if_no_reference()
  set.seed(11)
  n <- 100; p <- 50
  X <- matrix(rnorm(n * p), n, p)
  b <- rep(0, p); b[1:4] <- c(2, 3, -2, 1.5)
  y <- as.vector(X %*% b + rnorm(n))
  compare_to_reference("susie",
                       list(X = X, y = y, L = 10, min_abs_corr = 0.7,
                            estimate_prior_method = "simple"),
                       tolerance = 1e-5)
})

# =============================================================================
# Part 11: Combined parameter variations
# =============================================================================

test_that("susie() matches reference with combined parameters - optim", {
  skip_if_no_reference()
  set.seed(13)
  n <- 100; p <- 50
  X <- matrix(rnorm(n * p), n, p)
  b <- rep(0, p); b[1:4] <- c(2, 3, -2, 1.5)
  y <- as.vector(X %*% b + rnorm(n))
  # Combination 1: standardize=FALSE, intercept=FALSE
  compare_to_reference("susie",
                       list(X = X, y = y, L = 10, standardize = FALSE,
                            intercept = FALSE, estimate_prior_method = "optim"),
                       tolerance = 1e-5)
  # Combination 2: estimate_prior_variance=FALSE, estimate_residual_variance=FALSE
  compare_to_reference("susie",
                       list(X = X, y = y, L = 10,
                            estimate_prior_variance = FALSE,
                            estimate_residual_variance = FALSE,
                            residual_variance = 1.0,
                            estimate_prior_method = "optim"),
                       tolerance = 1e-5)
})

test_that("susie() matches reference with combined parameters - EM", {
  skip_if_no_reference()
  set.seed(13)
  n <- 100; p <- 50
  X <- matrix(rnorm(n * p), n, p)
  b <- rep(0, p); b[1:4] <- c(2, 3, -2, 1.5)
  y <- as.vector(X %*% b + rnorm(n))
  # Combination 1: standardize=FALSE, intercept=FALSE
  compare_to_reference("susie",
                       list(X = X, y = y, L = 10, standardize = FALSE,
                            intercept = FALSE, estimate_prior_method = "EM"),
                       tolerance = 1e-5)
  # Combination 2: estimate_prior_variance=FALSE, estimate_residual_variance=FALSE
  compare_to_reference("susie",
                       list(X = X, y = y, L = 10,
                            estimate_prior_variance = FALSE,
                            estimate_residual_variance = FALSE,
                            residual_variance = 1.0,
                            estimate_prior_method = "EM"),
                       tolerance = 1e-5)
})

test_that("susie() matches reference with combined parameters - simple", {
  skip_if_no_reference()
  set.seed(13)
  n <- 100; p <- 50
  X <- matrix(rnorm(n * p), n, p)
  b <- rep(0, p); b[1:4] <- c(2, 3, -2, 1.5)
  y <- as.vector(X %*% b + rnorm(n))
  # Combination 1: standardize=FALSE, intercept=FALSE
  compare_to_reference("susie",
                       list(X = X, y = y, L = 10, standardize = FALSE,
                            intercept = FALSE, estimate_prior_method = "simple"),
                       tolerance = 1e-5)
  # Combination 2: estimate_prior_variance=FALSE, estimate_residual_variance=FALSE
  compare_to_reference("susie",
                       list(X = X, y = y, L = 10,
                            estimate_prior_variance = FALSE,
                            estimate_residual_variance = FALSE,
                            residual_variance = 1.0,
                            estimate_prior_method = "simple"),
                       tolerance = 1e-5)
})

# =============================================================================
# Part 12: prior_tol parameter
# =============================================================================

test_that("susie() matches reference with prior_tol=0.1 - optim", {
  skip_if_no_reference()
  set.seed(14)
  n <- 100; p <- 50
  X <- matrix(rnorm(n * p), n, p)
  b <- rep(0, p); b[1:4] <- c(2, 3, -2, 1.5)
  y <- as.vector(X %*% b + rnorm(n))
  compare_to_reference("susie",
                       list(X = X, y = y, L = 10, prior_tol = 0.1,
                            estimate_prior_method = "optim"),
                       tolerance = 1e-5)
})

test_that("susie() matches reference with prior_tol=0.1 - EM", {
  skip("Intentional change: susieR2.0 adds a post-convergence trim_null_effects() pass that zeros model$V entries where V < prior_tol. The reference uses prior_tol only to filter PIPs in susie_get_pip(); it never zeros V. Any prior_tol value large enough to trigger the trim on dev but not the ref produces a divergence in the final V / alpha / mu that exceeds the 1e-5 tolerance.")
  skip_if_no_reference()
  set.seed(14)
  n <- 100; p <- 50
  X <- matrix(rnorm(n * p), n, p)
  b <- rep(0, p); b[1:4] <- c(2, 3, -2, 1.5)
  y <- as.vector(X %*% b + rnorm(n))
  compare_to_reference("susie",
                       list(X = X, y = y, L = 10, prior_tol = 0.1,
                            estimate_prior_method = "EM"),
                       tolerance = 1e-5)
})

test_that("susie() matches reference with prior_tol=0.1 - simple", {
  skip_if_no_reference()
  set.seed(14)
  n <- 100; p <- 50
  X <- matrix(rnorm(n * p), n, p)
  b <- rep(0, p); b[1:4] <- c(2, 3, -2, 1.5)
  y <- as.vector(X %*% b + rnorm(n))
  compare_to_reference("susie",
                       list(X = X, y = y, L = 10, prior_tol = 0.1,
                            estimate_prior_method = "simple"),
                       tolerance = 1e-5)
})

# =============================================================================
# Part 13: check_null_threshold parameter
# =============================================================================

test_that("susie() matches reference with check_null_threshold=0.1 - optim", {
  skip_if_no_reference()
  set.seed(15)
  n <- 100; p <- 50
  X <- matrix(rnorm(n * p), n, p)
  b <- rep(0, p); b[1:4] <- c(2, 3, -2, 1.5)
  y <- as.vector(X %*% b + rnorm(n))
  compare_to_reference("susie",
                       list(X = X, y = y, L = 10, check_null_threshold = 0.1,
                            estimate_prior_method = "optim"),
                       tolerance = 1e-5)
})

test_that("susie() matches reference with check_null_threshold=0.1 - EM", {
  skip("Not a bug: susieR2.0 intentionally skips the check_null_threshold V-zeroing step for EM (see R/single_effect_regression.R:169 and stephenslab/mvsusieR#26). The check would zero V without recomputing the posterior, creating an inconsistent (q, V) pair that can decrease the ELBO. Null effects are instead removed by trim_null_effects() after convergence. Since dev ignores check_null_threshold for EM, this test cannot match a reference that always applies the check.")
  skip_if_no_reference()
  set.seed(15)
  n <- 100; p <- 50
  X <- matrix(rnorm(n * p), n, p)
  b <- rep(0, p); b[1:4] <- c(2, 3, -2, 1.5)
  y <- as.vector(X %*% b + rnorm(n))
  compare_to_reference("susie",
                       list(X = X, y = y, L = 10, check_null_threshold = 0.1,
                            estimate_prior_method = "EM"),
                       tolerance = 1e-5)
})

test_that("susie() matches reference with check_null_threshold=0.1 - simple", {
  skip_if_no_reference()
  set.seed(15)
  n <- 100; p <- 50
  X <- matrix(rnorm(n * p), n, p)
  b <- rep(0, p); b[1:4] <- c(2, 3, -2, 1.5)
  y <- as.vector(X %*% b + rnorm(n))
  compare_to_reference("susie",
                       list(X = X, y = y, L = 10, check_null_threshold = 0.1,
                            estimate_prior_method = "simple"),
                       tolerance = 1e-5)
})

test_that("susie() matches reference with check_null_threshold=0.5 - optim", {
  skip_if_no_reference()
  set.seed(16)
  n <- 100; p <- 50
  X <- matrix(rnorm(n * p), n, p)
  b <- rep(0, p); b[1:4] <- c(2, 3, -2, 1.5)
  y <- as.vector(X %*% b + rnorm(n))
  compare_to_reference("susie",
                       list(X = X, y = y, L = 10, check_null_threshold = 0.5,
                            estimate_prior_method = "optim"),
                       tolerance = 1e-5)
})

test_that("susie() matches reference with check_null_threshold=0.5 - EM", {
  skip("Not a bug: susieR2.0 intentionally skips the check_null_threshold V-zeroing step for EM (see R/single_effect_regression.R:169 and stephenslab/mvsusieR#26). The check would zero V without recomputing the posterior, creating an inconsistent (q, V) pair that can decrease the ELBO. Since dev ignores check_null_threshold for EM, this test cannot match a reference that always applies the check.")
  skip_if_no_reference()
  set.seed(16)
  n <- 100; p <- 50
  X <- matrix(rnorm(n * p), n, p)
  b <- rep(0, p); b[1:4] <- c(2, 3, -2, 1.5)
  y <- as.vector(X %*% b + rnorm(n))
  compare_to_reference("susie",
                       list(X = X, y = y, L = 10, check_null_threshold = 0.5,
                            estimate_prior_method = "EM"),
                       tolerance = 1e-5)
})

test_that("susie() matches reference with check_null_threshold=0.5 - simple", {
  skip_if_no_reference()
  set.seed(16)
  n <- 100; p <- 50
  X <- matrix(rnorm(n * p), n, p)
  b <- rep(0, p); b[1:4] <- c(2, 3, -2, 1.5)
  y <- as.vector(X %*% b + rnorm(n))
  compare_to_reference("susie",
                       list(X = X, y = y, L = 10, check_null_threshold = 0.5,
                            estimate_prior_method = "simple"),
                       tolerance = 1e-5)
})

# =============================================================================
# Part 14: residual_variance bounds
# =============================================================================

test_that("susie() matches reference with residual_variance_upperbound - optim", {
  skip_if_no_reference()
  set.seed(17)
  n <- 100; p <- 50
  X <- matrix(rnorm(n * p), n, p)
  b <- rep(0, p); b[1:4] <- c(2, 3, -2, 1.5)
  y <- as.vector(X %*% b + rnorm(n))
  # Upperbound below the natural residual variance (~1.07) so it binds.
  compare_to_reference("susie",
                       list(X = X, y = y, L = 10,
                            residual_variance_upperbound = 0.8,
                            estimate_prior_method = "optim"),
                       tolerance = 1e-5)
})

test_that("susie() matches reference with residual_variance_upperbound - EM", {
  skip_if_no_reference()
  set.seed(17)
  n <- 100; p <- 50
  X <- matrix(rnorm(n * p), n, p)
  b <- rep(0, p); b[1:4] <- c(2, 3, -2, 1.5)
  y <- as.vector(X %*% b + rnorm(n))
  # Upperbound below the natural residual variance (~1.07) so it binds.
  compare_to_reference("susie",
                       list(X = X, y = y, L = 10,
                            residual_variance_upperbound = 0.8,
                            estimate_prior_method = "EM"),
                       tolerance = 1e-5)
})

test_that("susie() matches reference with residual_variance_upperbound - simple", {
  skip("Intentional improvement: reference declares convergence on any ELBO change below tol (including negative), so it stops at iter 2 after the ELBO drops by ~25 (because the binding upperbound=0.8 forces sigma2 away from the MLE). susieR2.0 requires 0 <= ELBO_diff < tol (see R/model_methods.R:229-233), correctly continues iterating, and lands at a slightly better ELBO with different mu. Posterior alpha, V, and sigma2 match to ~1e-17; only mu differs (up to 0.5) because the reference returned a mid-drop snapshot.")
  skip_if_no_reference()
  set.seed(17)
  n <- 100; p <- 50
  X <- matrix(rnorm(n * p), n, p)
  b <- rep(0, p); b[1:4] <- c(2, 3, -2, 1.5)
  y <- as.vector(X %*% b + rnorm(n))
  # Upperbound below the natural residual variance (~1.07) so it binds.
  compare_to_reference("susie",
                       list(X = X, y = y, L = 10,
                            residual_variance_upperbound = 0.8,
                            estimate_prior_method = "simple"),
                       tolerance = 1e-5)
})

test_that("susie() matches reference with residual_variance_lowerbound - optim", {
  skip_if_no_reference()
  set.seed(18)
  n <- 100; p <- 50
  X <- matrix(rnorm(n * p), n, p)
  b <- rep(0, p); b[1:4] <- c(2, 3, -2, 1.5)
  y <- as.vector(X %*% b + rnorm(n))
  # Lowerbound above the natural residual variance (~1.07) so it binds.
  compare_to_reference("susie",
                       list(X = X, y = y, L = 10,
                            residual_variance_lowerbound = 1.5,
                            estimate_prior_method = "optim"),
                       tolerance = 1e-5)
})

test_that("susie() matches reference with residual_variance_lowerbound - EM", {
  skip_if_no_reference()
  set.seed(18)
  n <- 100; p <- 50
  X <- matrix(rnorm(n * p), n, p)
  b <- rep(0, p); b[1:4] <- c(2, 3, -2, 1.5)
  y <- as.vector(X %*% b + rnorm(n))
  # Lowerbound above the natural residual variance (~1.07) so it binds.
  compare_to_reference("susie",
                       list(X = X, y = y, L = 10,
                            residual_variance_lowerbound = 1.5,
                            estimate_prior_method = "EM"),
                       tolerance = 1e-5)
})

test_that("susie() matches reference with residual_variance_lowerbound - simple", {
  skip_if_no_reference()
  set.seed(18)
  n <- 100; p <- 50
  X <- matrix(rnorm(n * p), n, p)
  b <- rep(0, p); b[1:4] <- c(2, 3, -2, 1.5)
  y <- as.vector(X %*% b + rnorm(n))
  # Lowerbound above the natural residual variance (~1.07) so it binds.
  compare_to_reference("susie",
                       list(X = X, y = y, L = 10,
                            residual_variance_lowerbound = 1.5,
                            estimate_prior_method = "simple"),
                       tolerance = 1e-5)
})

# =============================================================================
# Part 15: na.rm parameter
# =============================================================================

test_that("susie() matches reference with na.rm=TRUE - optim", {
  skip_if_no_reference()
  set.seed(19)
  n <- 100; p <- 50
  X <- matrix(rnorm(n * p), n, p)
  b <- rep(0, p); b[1:4] <- c(2, 3, -2, 1.5)
  y <- as.vector(X %*% b + rnorm(n))
  # Introduce NA values scattered through the response.
  y[c(1, 25, 50)] <- NA
  compare_to_reference("susie",
                       list(X = X, y = y, L = 10, na.rm = TRUE,
                            estimate_prior_method = "optim"),
                       tolerance = 1e-5)
})

test_that("susie() matches reference with na.rm=TRUE - EM", {
  skip_if_no_reference()
  set.seed(19)
  n <- 100; p <- 50
  X <- matrix(rnorm(n * p), n, p)
  b <- rep(0, p); b[1:4] <- c(2, 3, -2, 1.5)
  y <- as.vector(X %*% b + rnorm(n))
  y[c(1, 25, 50)] <- NA
  compare_to_reference("susie",
                       list(X = X, y = y, L = 10, na.rm = TRUE,
                            estimate_prior_method = "EM"),
                       tolerance = 1e-5)
})

test_that("susie() matches reference with na.rm=TRUE - simple", {
  skip_if_no_reference()
  set.seed(19)
  n <- 100; p <- 50
  X <- matrix(rnorm(n * p), n, p)
  b <- rep(0, p); b[1:4] <- c(2, 3, -2, 1.5)
  y <- as.vector(X %*% b + rnorm(n))
  y[c(1, 25, 50)] <- NA
  compare_to_reference("susie",
                       list(X = X, y = y, L = 10, na.rm = TRUE,
                            estimate_prior_method = "simple"),
                       tolerance = 1e-5)
})

test_that("susie() matches reference with na.rm=TRUE and single NA - optim", {
  skip_if_no_reference()
  set.seed(20)
  n <- 100; p <- 50
  X <- matrix(rnorm(n * p), n, p)
  b <- rep(0, p); b[1:4] <- c(2, 3, -2, 1.5)
  y <- as.vector(X %*% b + rnorm(n))
  # Single NA (the bug report case)
  y[1] <- NA
  compare_to_reference("susie",
                       list(X = X, y = y, L = 10, na.rm = TRUE,
                            estimate_prior_method = "optim"),
                       tolerance = 1e-5)
})

test_that("susie() matches reference with na.rm=TRUE and standardize=FALSE", {
  skip_if_no_reference()
  set.seed(21)
  n <- 100; p <- 50
  X <- matrix(rnorm(n * p), n, p)
  b <- rep(0, p); b[1:4] <- c(2, 3, -2, 1.5)
  y <- as.vector(X %*% b + rnorm(n))
  y[c(5, 10, 15)] <- NA
  compare_to_reference("susie",
                       list(X = X, y = y, L = 10, na.rm = TRUE,
                            standardize = FALSE, estimate_prior_method = "optim"),
                       tolerance = 1e-5)
})

test_that("susie() matches reference with na.rm=TRUE and intercept=FALSE", {
  skip_if_no_reference()
  set.seed(22)
  n <- 100; p <- 50
  X <- matrix(rnorm(n * p), n, p)
  b <- rep(0, p); b[1:4] <- c(2, 3, -2, 1.5)
  y <- as.vector(X %*% b + rnorm(n))
  y[c(10, 20, 30)] <- NA
  compare_to_reference("susie",
                       list(X = X, y = y, L = 10, na.rm = TRUE,
                            intercept = FALSE, estimate_prior_method = "optim"),
                       tolerance = 1e-5)
})

# =============================================================================
# Part 16: model_init parameter (dev) vs s_init (reference)
# =============================================================================
#
# These tests verify that our model_init parameter produces identical results to
# the reference package's s_init parameter. Each test runs an initial susie fit
# on both packages, then passes the result as model_init/s_init to a second
# call and compares outputs.

test_that("susie() matches reference with model_init - optim", {
  skip_if_no_reference()
  ref_env <- load_reference_env()
  dev_env <- load_development_env()
  set.seed(23)
  n <- 100; p <- 50
  X <- matrix(rnorm(n * p), n, p)
  b <- rep(0, p); b[1:4] <- c(2, 3, -2, 1.5)
  y <- as.vector(X %*% b + rnorm(n))
  # Short initial run on both packages to obtain a non-trivial starting model.
  init_args <- list(X = X, y = y, L = 5, max_iter = 3,
                    estimate_prior_method = "optim")
  dev_init <- do.call(dev_env$env[["susie"]], inject_em_null_check(init_args))
  ref_init <- do.call(ref_env$env[["susie"]], inject_em_null_check(init_args))
  # Restart from the fitted model: model_init on dev, s_init on the reference.
  dev_args <- list(X = X, y = y, L = 5, model_init = dev_init,
                   estimate_prior_method = "optim")
  ref_args <- list(X = X, y = y, L = 5, s_init = ref_init,
                   estimate_prior_method = "optim")
  dev_result <- do.call(dev_env$env[["susie"]], inject_em_null_check(dev_args))
  ref_result <- do.call(ref_env$env[["susie"]], inject_em_null_check(ref_args))
  expect_equal_susie_objects(dev_result, ref_result, tolerance = 1e-5)
})

test_that("susie() matches reference with model_init - EM", {
  skip_if_no_reference()
  ref_env <- load_reference_env()
  dev_env <- load_development_env()
  set.seed(23)
  n <- 100; p <- 50
  X <- matrix(rnorm(n * p), n, p)
  b <- rep(0, p); b[1:4] <- c(2, 3, -2, 1.5)
  y <- as.vector(X %*% b + rnorm(n))
  init_args <- list(X = X, y = y, L = 5, max_iter = 3,
                    estimate_prior_method = "EM")
  dev_init <- do.call(dev_env$env[["susie"]], inject_em_null_check(init_args))
  ref_init <- do.call(ref_env$env[["susie"]], inject_em_null_check(init_args))
  dev_args <- list(X = X, y = y, L = 5, model_init = dev_init,
                   estimate_prior_method = "EM")
  ref_args <- list(X = X, y = y, L = 5, s_init = ref_init,
                   estimate_prior_method = "EM")
  dev_result <- do.call(dev_env$env[["susie"]], inject_em_null_check(dev_args))
  ref_result <- do.call(ref_env$env[["susie"]], inject_em_null_check(ref_args))
  expect_equal_susie_objects(dev_result, ref_result, tolerance = 1e-5)
})

test_that("susie() matches reference with model_init - simple", {
  skip_if_no_reference()
  ref_env <- load_reference_env()
  dev_env <- load_development_env()
  set.seed(23)
  n <- 100; p <- 50
  X <- matrix(rnorm(n * p), n, p)
  b <- rep(0, p); b[1:4] <- c(2, 3, -2, 1.5)
  y <- as.vector(X %*% b + rnorm(n))
  init_args <- list(X = X, y = y, L = 5, max_iter = 3,
                    estimate_prior_method = "simple")
  dev_init <- do.call(dev_env$env[["susie"]], inject_em_null_check(init_args))
  ref_init <- do.call(ref_env$env[["susie"]], inject_em_null_check(init_args))
  dev_args <- list(X = X, y = y, L = 5, model_init = dev_init,
                   estimate_prior_method = "simple")
  ref_args <- list(X = X, y = y, L = 5, s_init = ref_init,
                   estimate_prior_method = "simple")
  dev_result <- do.call(dev_env$env[["susie"]], inject_em_null_check(dev_args))
  ref_result <- do.call(ref_env$env[["susie"]], inject_em_null_check(ref_args))
  expect_equal_susie_objects(dev_result, ref_result, tolerance = 1e-5)
})

# model_init with estimate_residual_variance=FALSE

test_that("susie() matches reference with model_init and estimate_residual_variance=FALSE - optim", {
  skip_if_no_reference()
  ref_env <- load_reference_env()
  dev_env <- load_development_env()
  set.seed(24)
  n <- 100; p <- 50
  X <- matrix(rnorm(n * p), n, p)
  b <- rep(0, p); b[1:4] <- c(2, 3, -2, 1.5)
  y <- as.vector(X %*% b + rnorm(n))
  init_args <- list(X = X, y = y, L = 5, max_iter = 3,
                    estimate_prior_method = "optim")
  dev_init <- do.call(dev_env$env[["susie"]], inject_em_null_check(init_args))
  ref_init <- do.call(ref_env$env[["susie"]], inject_em_null_check(init_args))
  dev_args <- list(X = X, y = y, L = 5, model_init = dev_init,
                   estimate_residual_variance = FALSE, residual_variance = 1.0,
                   estimate_prior_method = "optim")
  ref_args <- list(X = X, y = y, L = 5, s_init = ref_init,
                   estimate_residual_variance = FALSE, residual_variance = 1.0,
                   estimate_prior_method = "optim")
  dev_result <- do.call(dev_env$env[["susie"]], inject_em_null_check(dev_args))
  ref_result <- do.call(ref_env$env[["susie"]], inject_em_null_check(ref_args))
  expect_equal_susie_objects(dev_result, ref_result, tolerance = 1e-5)
})

test_that("susie() matches reference with model_init and estimate_residual_variance=FALSE - EM", {
  skip_if_no_reference()
  ref_env <- load_reference_env()
  dev_env <- load_development_env()
  set.seed(24)
  n <- 100; p <- 50
  X <- matrix(rnorm(n * p), n, p)
  b <- rep(0, p); b[1:4] <- c(2, 3, -2, 1.5)
  y <- as.vector(X %*% b + rnorm(n))
  init_args <- list(X = X, y = y, L = 5, max_iter = 3,
                    estimate_prior_method = "EM")
  dev_init <- do.call(dev_env$env[["susie"]], inject_em_null_check(init_args))
  ref_init <- do.call(ref_env$env[["susie"]], inject_em_null_check(init_args))
  dev_args <- list(X = X, y = y, L = 5, model_init = dev_init,
                   estimate_residual_variance = FALSE, residual_variance = 1.0,
                   estimate_prior_method = "EM")
  ref_args <- list(X = X, y = y, L = 5, s_init = ref_init,
                   estimate_residual_variance = FALSE, residual_variance = 1.0,
                   estimate_prior_method = "EM")
  dev_result <- do.call(dev_env$env[["susie"]], inject_em_null_check(dev_args))
  ref_result <- do.call(ref_env$env[["susie"]], inject_em_null_check(ref_args))
  expect_equal_susie_objects(dev_result, ref_result, tolerance = 1e-5)
})

test_that("susie() matches reference with model_init and estimate_residual_variance=FALSE - simple", {
  skip_if_no_reference()
  ref_env <- load_reference_env()
  dev_env <- load_development_env()
  set.seed(24)
  n <- 100; p <- 50
  X <- matrix(rnorm(n * p), n, p)
  beta <- rep(0, p)
  beta[1:4] <- c(2, 3, -2, 1.5)
  y <- as.vector(X %*% beta + rnorm(n))
  init_args <- list(X = X, y = y, L = 5, max_iter = 3,
                    estimate_prior_method = "simple")
  dev_init <- do.call(dev_env$env[["susie"]], inject_em_null_check(init_args))
  ref_init <- do.call(ref_env$env[["susie"]],
inject_em_null_check(init_args)) dev_args <- list(X = X, y = y, L = 5, model_init = dev_init, estimate_residual_variance = FALSE, residual_variance = 1.0, estimate_prior_method = "simple") ref_args <- list(X = X, y = y, L = 5, s_init = ref_init, estimate_residual_variance = FALSE, residual_variance = 1.0, estimate_prior_method = "simple") dev_result <- do.call(dev_env$env[["susie"]], inject_em_null_check(dev_args)) ref_result <- do.call(ref_env$env[["susie"]], inject_em_null_check(ref_args)) expect_equal_susie_objects(dev_result, ref_result, tolerance = 1e-5) }) # model_init with estimate_prior_variance=FALSE test_that("susie() matches reference with model_init and estimate_prior_variance=FALSE", { skip_if_no_reference() ref_env <- load_reference_env() dev_env <- load_development_env() set.seed(25) n <- 100 p <- 50 X <- matrix(rnorm(n * p), n, p) beta <- rep(0, p) beta[1:4] <- c(2, 3, -2, 1.5) y <- as.vector(X %*% beta + rnorm(n)) init_args <- list(X = X, y = y, L = 5, max_iter = 3, estimate_prior_variance = FALSE) dev_init <- do.call(dev_env$env[["susie"]], inject_em_null_check(init_args)) ref_init <- do.call(ref_env$env[["susie"]], inject_em_null_check(init_args)) dev_args <- list(X = X, y = y, L = 5, model_init = dev_init, estimate_prior_variance = FALSE) ref_args <- list(X = X, y = y, L = 5, s_init = ref_init, estimate_prior_variance = FALSE) dev_result <- do.call(dev_env$env[["susie"]], inject_em_null_check(dev_args)) ref_result <- do.call(ref_env$env[["susie"]], inject_em_null_check(ref_args)) expect_equal_susie_objects(dev_result, ref_result, tolerance = 1e-5) }) # model_init with standardize=FALSE test_that("susie() matches reference with model_init and standardize=FALSE - optim", { skip_if_no_reference() ref_env <- load_reference_env() dev_env <- load_development_env() set.seed(26) n <- 100 p <- 50 X <- matrix(rnorm(n * p), n, p) beta <- rep(0, p) beta[1:4] <- c(2, 3, -2, 1.5) y <- as.vector(X %*% beta + rnorm(n)) init_args <- list(X = X, y = y, L = 5, 
max_iter = 3, standardize = FALSE, estimate_prior_method = "optim") dev_init <- do.call(dev_env$env[["susie"]], inject_em_null_check(init_args)) ref_init <- do.call(ref_env$env[["susie"]], inject_em_null_check(init_args)) dev_args <- list(X = X, y = y, L = 5, model_init = dev_init, standardize = FALSE, estimate_prior_method = "optim") ref_args <- list(X = X, y = y, L = 5, s_init = ref_init, standardize = FALSE, estimate_prior_method = "optim") dev_result <- do.call(dev_env$env[["susie"]], inject_em_null_check(dev_args)) ref_result <- do.call(ref_env$env[["susie"]], inject_em_null_check(ref_args)) expect_equal_susie_objects(dev_result, ref_result, tolerance = 1e-5) }) test_that("susie() matches reference with model_init and standardize=FALSE - EM", { skip_if_no_reference() ref_env <- load_reference_env() dev_env <- load_development_env() set.seed(26) n <- 100 p <- 50 X <- matrix(rnorm(n * p), n, p) beta <- rep(0, p) beta[1:4] <- c(2, 3, -2, 1.5) y <- as.vector(X %*% beta + rnorm(n)) init_args <- list(X = X, y = y, L = 5, max_iter = 3, standardize = FALSE, estimate_prior_method = "EM") dev_init <- do.call(dev_env$env[["susie"]], inject_em_null_check(init_args)) ref_init <- do.call(ref_env$env[["susie"]], inject_em_null_check(init_args)) dev_args <- list(X = X, y = y, L = 5, model_init = dev_init, standardize = FALSE, estimate_prior_method = "EM") ref_args <- list(X = X, y = y, L = 5, s_init = ref_init, standardize = FALSE, estimate_prior_method = "EM") dev_result <- do.call(dev_env$env[["susie"]], inject_em_null_check(dev_args)) ref_result <- do.call(ref_env$env[["susie"]], inject_em_null_check(ref_args)) expect_equal_susie_objects(dev_result, ref_result, tolerance = 1e-5) }) test_that("susie() matches reference with model_init and standardize=FALSE - simple", { skip_if_no_reference() ref_env <- load_reference_env() dev_env <- load_development_env() set.seed(26) n <- 100 p <- 50 X <- matrix(rnorm(n * p), n, p) beta <- rep(0, p) beta[1:4] <- c(2, 3, -2, 1.5) y <- 
as.vector(X %*% beta + rnorm(n)) init_args <- list(X = X, y = y, L = 5, max_iter = 3, standardize = FALSE, estimate_prior_method = "simple") dev_init <- do.call(dev_env$env[["susie"]], inject_em_null_check(init_args)) ref_init <- do.call(ref_env$env[["susie"]], inject_em_null_check(init_args)) dev_args <- list(X = X, y = y, L = 5, model_init = dev_init, standardize = FALSE, estimate_prior_method = "simple") ref_args <- list(X = X, y = y, L = 5, s_init = ref_init, standardize = FALSE, estimate_prior_method = "simple") dev_result <- do.call(dev_env$env[["susie"]], inject_em_null_check(dev_args)) ref_result <- do.call(ref_env$env[["susie"]], inject_em_null_check(ref_args)) expect_equal_susie_objects(dev_result, ref_result, tolerance = 1e-5) }) # model_init with intercept=FALSE test_that("susie() matches reference with model_init and intercept=FALSE - optim", { skip_if_no_reference() ref_env <- load_reference_env() dev_env <- load_development_env() set.seed(27) n <- 100 p <- 50 X <- matrix(rnorm(n * p), n, p) beta <- rep(0, p) beta[1:4] <- c(2, 3, -2, 1.5) y <- as.vector(X %*% beta + rnorm(n)) init_args <- list(X = X, y = y, L = 5, max_iter = 3, intercept = FALSE, estimate_prior_method = "optim") dev_init <- do.call(dev_env$env[["susie"]], inject_em_null_check(init_args)) ref_init <- do.call(ref_env$env[["susie"]], inject_em_null_check(init_args)) dev_args <- list(X = X, y = y, L = 5, model_init = dev_init, intercept = FALSE, estimate_prior_method = "optim") ref_args <- list(X = X, y = y, L = 5, s_init = ref_init, intercept = FALSE, estimate_prior_method = "optim") dev_result <- do.call(dev_env$env[["susie"]], inject_em_null_check(dev_args)) ref_result <- do.call(ref_env$env[["susie"]], inject_em_null_check(ref_args)) expect_equal_susie_objects(dev_result, ref_result, tolerance = 1e-5) }) test_that("susie() matches reference with model_init and intercept=FALSE - EM", { skip_if_no_reference() ref_env <- load_reference_env() dev_env <- load_development_env() set.seed(27) 
n <- 100 p <- 50 X <- matrix(rnorm(n * p), n, p) beta <- rep(0, p) beta[1:4] <- c(2, 3, -2, 1.5) y <- as.vector(X %*% beta + rnorm(n)) init_args <- list(X = X, y = y, L = 5, max_iter = 3, intercept = FALSE, estimate_prior_method = "EM") dev_init <- do.call(dev_env$env[["susie"]], inject_em_null_check(init_args)) ref_init <- do.call(ref_env$env[["susie"]], inject_em_null_check(init_args)) dev_args <- list(X = X, y = y, L = 5, model_init = dev_init, intercept = FALSE, estimate_prior_method = "EM") ref_args <- list(X = X, y = y, L = 5, s_init = ref_init, intercept = FALSE, estimate_prior_method = "EM") dev_result <- do.call(dev_env$env[["susie"]], inject_em_null_check(dev_args)) ref_result <- do.call(ref_env$env[["susie"]], inject_em_null_check(ref_args)) expect_equal_susie_objects(dev_result, ref_result, tolerance = 1e-5) }) test_that("susie() matches reference with model_init and intercept=FALSE - simple", { skip_if_no_reference() ref_env <- load_reference_env() dev_env <- load_development_env() set.seed(27) n <- 100 p <- 50 X <- matrix(rnorm(n * p), n, p) beta <- rep(0, p) beta[1:4] <- c(2, 3, -2, 1.5) y <- as.vector(X %*% beta + rnorm(n)) init_args <- list(X = X, y = y, L = 5, max_iter = 3, intercept = FALSE, estimate_prior_method = "simple") dev_init <- do.call(dev_env$env[["susie"]], inject_em_null_check(init_args)) ref_init <- do.call(ref_env$env[["susie"]], inject_em_null_check(init_args)) dev_args <- list(X = X, y = y, L = 5, model_init = dev_init, intercept = FALSE, estimate_prior_method = "simple") ref_args <- list(X = X, y = y, L = 5, s_init = ref_init, intercept = FALSE, estimate_prior_method = "simple") dev_result <- do.call(dev_env$env[["susie"]], inject_em_null_check(dev_args)) ref_result <- do.call(ref_env$env[["susie"]], inject_em_null_check(ref_args)) expect_equal_susie_objects(dev_result, ref_result, tolerance = 1e-5) }) # model_init with L expansion (second call requests more effects than init) test_that("susie() matches reference with model_init 
and L expansion - optim", { skip_if_no_reference() ref_env <- load_reference_env() dev_env <- load_development_env() set.seed(28) n <- 100 p <- 50 X <- matrix(rnorm(n * p), n, p) beta <- rep(0, p) beta[1:4] <- c(2, 3, -2, 1.5) y <- as.vector(X %*% beta + rnorm(n)) # Initial fit with L=3 init_args <- list(X = X, y = y, L = 3, max_iter = 3, estimate_prior_method = "optim") dev_init <- do.call(dev_env$env[["susie"]], inject_em_null_check(init_args)) ref_init <- do.call(ref_env$env[["susie"]], inject_em_null_check(init_args)) # Second fit with L=10 (expansion) dev_args <- list(X = X, y = y, L = 10, model_init = dev_init, estimate_prior_method = "optim") ref_args <- list(X = X, y = y, L = 10, s_init = ref_init, estimate_prior_method = "optim") dev_result <- suppressMessages(do.call(dev_env$env[["susie"]], inject_em_null_check(dev_args))) ref_result <- suppressMessages(do.call(ref_env$env[["susie"]], inject_em_null_check(ref_args))) expect_equal_susie_objects(dev_result, ref_result, tolerance = 1e-5) }) test_that("susie() matches reference with model_init and L expansion - EM", { skip("Intentional improvement: susieR2.0 preserves fitted V during L expansion; reference resets all V to default. 
EM updates V incrementally so intermediate ELBOs differ, but final posteriors converge.") skip_if_no_reference() ref_env <- load_reference_env() dev_env <- load_development_env() set.seed(28) n <- 100 p <- 50 X <- matrix(rnorm(n * p), n, p) beta <- rep(0, p) beta[1:4] <- c(2, 3, -2, 1.5) y <- as.vector(X %*% beta + rnorm(n)) init_args <- list(X = X, y = y, L = 3, max_iter = 3, estimate_prior_method = "EM") dev_init <- do.call(dev_env$env[["susie"]], inject_em_null_check(init_args)) ref_init <- do.call(ref_env$env[["susie"]], inject_em_null_check(init_args)) dev_args <- list(X = X, y = y, L = 10, model_init = dev_init, estimate_prior_method = "EM") ref_args <- list(X = X, y = y, L = 10, s_init = ref_init, estimate_prior_method = "EM") dev_result <- suppressMessages(do.call(dev_env$env[["susie"]], inject_em_null_check(dev_args))) ref_result <- suppressMessages(do.call(ref_env$env[["susie"]], inject_em_null_check(ref_args))) expect_equal_susie_objects(dev_result, ref_result, tolerance = 1e-5) }) test_that("susie() matches reference with model_init and L expansion - simple", { skip_if_no_reference() ref_env <- load_reference_env() dev_env <- load_development_env() set.seed(28) n <- 100 p <- 50 X <- matrix(rnorm(n * p), n, p) beta <- rep(0, p) beta[1:4] <- c(2, 3, -2, 1.5) y <- as.vector(X %*% beta + rnorm(n)) init_args <- list(X = X, y = y, L = 3, max_iter = 3, estimate_prior_method = "simple") dev_init <- do.call(dev_env$env[["susie"]], inject_em_null_check(init_args)) ref_init <- do.call(ref_env$env[["susie"]], inject_em_null_check(init_args)) dev_args <- list(X = X, y = y, L = 10, model_init = dev_init, estimate_prior_method = "simple") ref_args <- list(X = X, y = y, L = 10, s_init = ref_init, estimate_prior_method = "simple") dev_result <- suppressMessages(do.call(dev_env$env[["susie"]], inject_em_null_check(dev_args))) ref_result <- suppressMessages(do.call(ref_env$env[["susie"]], inject_em_null_check(ref_args))) expect_equal_susie_objects(dev_result, ref_result, 
tolerance = 1e-5) }) # model_init with combined standardize=FALSE and intercept=FALSE test_that("susie() matches reference with model_init, standardize=FALSE, intercept=FALSE - optim", { skip_if_no_reference() ref_env <- load_reference_env() dev_env <- load_development_env() set.seed(29) n <- 100 p <- 50 X <- matrix(rnorm(n * p), n, p) beta <- rep(0, p) beta[1:4] <- c(2, 3, -2, 1.5) y <- as.vector(X %*% beta + rnorm(n)) init_args <- list(X = X, y = y, L = 5, max_iter = 3, standardize = FALSE, intercept = FALSE, estimate_prior_method = "optim") dev_init <- do.call(dev_env$env[["susie"]], inject_em_null_check(init_args)) ref_init <- do.call(ref_env$env[["susie"]], inject_em_null_check(init_args)) dev_args <- list(X = X, y = y, L = 5, model_init = dev_init, standardize = FALSE, intercept = FALSE, estimate_prior_method = "optim") ref_args <- list(X = X, y = y, L = 5, s_init = ref_init, standardize = FALSE, intercept = FALSE, estimate_prior_method = "optim") dev_result <- do.call(dev_env$env[["susie"]], inject_em_null_check(dev_args)) ref_result <- do.call(ref_env$env[["susie"]], inject_em_null_check(ref_args)) expect_equal_susie_objects(dev_result, ref_result, tolerance = 1e-5) }) # ============================================================================= # Part 17: model_init with L expansion - deeper probing for differences # ============================================================================= # # These tests specifically target L expansion (model_init has fewer effects # than the requested L) with various parameter combinations to find behavioral # differences between model_init (dev) and s_init (ref). # L expansion with estimate_prior_variance=FALSE # When V is never re-estimated, any difference in V initialization should # propagate through all iterations and affect final posteriors. 
test_that("susie() matches reference with model_init, L expansion, estimate_prior_variance=FALSE - optim", { skip("Intentional improvement: susieR2.0 preserves fitted V during L expansion; reference resets all V to default. With estimate_prior_variance=FALSE, the V difference persists in final posteriors.") skip_if_no_reference() ref_env <- load_reference_env() dev_env <- load_development_env() set.seed(30) n <- 100 p <- 50 X <- matrix(rnorm(n * p), n, p) beta <- rep(0, p) beta[1:4] <- c(2, 3, -2, 1.5) y <- as.vector(X %*% beta + rnorm(n)) # Initial fit with L=3 init_args <- list(X = X, y = y, L = 3, max_iter = 5, estimate_prior_method = "optim") dev_init <- do.call(dev_env$env[["susie"]], inject_em_null_check(init_args)) ref_init <- do.call(ref_env$env[["susie"]], inject_em_null_check(init_args)) # Second fit with L=8, estimate_prior_variance=FALSE dev_args <- list(X = X, y = y, L = 8, model_init = dev_init, estimate_prior_variance = FALSE, estimate_prior_method = "optim") ref_args <- list(X = X, y = y, L = 8, s_init = ref_init, estimate_prior_variance = FALSE, estimate_prior_method = "optim") dev_result <- suppressMessages(do.call(dev_env$env[["susie"]], inject_em_null_check(dev_args))) ref_result <- suppressMessages(do.call(ref_env$env[["susie"]], inject_em_null_check(ref_args))) expect_equal_susie_objects(dev_result, ref_result, tolerance = 1e-5) }) test_that("susie() matches reference with model_init, L expansion, estimate_prior_variance=FALSE - simple", { skip_if_no_reference() ref_env <- load_reference_env() dev_env <- load_development_env() set.seed(30) n <- 100 p <- 50 X <- matrix(rnorm(n * p), n, p) beta <- rep(0, p) beta[1:4] <- c(2, 3, -2, 1.5) y <- as.vector(X %*% beta + rnorm(n)) init_args <- list(X = X, y = y, L = 3, max_iter = 5, estimate_prior_method = "simple") dev_init <- do.call(dev_env$env[["susie"]], inject_em_null_check(init_args)) ref_init <- do.call(ref_env$env[["susie"]], inject_em_null_check(init_args)) dev_args <- list(X = X, y = y, L = 
8, model_init = dev_init, estimate_prior_variance = FALSE, estimate_prior_method = "simple") ref_args <- list(X = X, y = y, L = 8, s_init = ref_init, estimate_prior_variance = FALSE, estimate_prior_method = "simple") dev_result <- suppressMessages(do.call(dev_env$env[["susie"]], inject_em_null_check(dev_args))) ref_result <- suppressMessages(do.call(ref_env$env[["susie"]], inject_em_null_check(ref_args))) expect_equal_susie_objects(dev_result, ref_result, tolerance = 1e-5) }) # L expansion with BOTH estimate_prior_variance=FALSE AND estimate_residual_variance=FALSE # Fully constrained variances - any V initialization difference is permanent. test_that("susie() matches reference with model_init, L expansion, both variances fixed - optim", { skip("Intentional improvement: susieR2.0 preserves fitted V during L expansion; reference resets all V to default. With both variances fixed, the V difference persists in final posteriors.") skip_if_no_reference() ref_env <- load_reference_env() dev_env <- load_development_env() set.seed(31) n <- 100 p <- 50 X <- matrix(rnorm(n * p), n, p) beta <- rep(0, p) beta[1:4] <- c(2, 3, -2, 1.5) y <- as.vector(X %*% beta + rnorm(n)) init_args <- list(X = X, y = y, L = 3, max_iter = 5, estimate_prior_method = "optim") dev_init <- do.call(dev_env$env[["susie"]], inject_em_null_check(init_args)) ref_init <- do.call(ref_env$env[["susie"]], inject_em_null_check(init_args)) dev_args <- list(X = X, y = y, L = 8, model_init = dev_init, estimate_prior_variance = FALSE, estimate_residual_variance = FALSE, residual_variance = 1.0, estimate_prior_method = "optim") ref_args <- list(X = X, y = y, L = 8, s_init = ref_init, estimate_prior_variance = FALSE, estimate_residual_variance = FALSE, residual_variance = 1.0, estimate_prior_method = "optim") dev_result <- suppressMessages(do.call(dev_env$env[["susie"]], inject_em_null_check(dev_args))) ref_result <- suppressMessages(do.call(ref_env$env[["susie"]], inject_em_null_check(ref_args))) 
expect_equal_susie_objects(dev_result, ref_result, tolerance = 1e-5) }) test_that("susie() matches reference with model_init, L expansion, both variances fixed - simple", { skip_if_no_reference() ref_env <- load_reference_env() dev_env <- load_development_env() set.seed(31) n <- 100 p <- 50 X <- matrix(rnorm(n * p), n, p) beta <- rep(0, p) beta[1:4] <- c(2, 3, -2, 1.5) y <- as.vector(X %*% beta + rnorm(n)) init_args <- list(X = X, y = y, L = 3, max_iter = 5, estimate_prior_method = "simple") dev_init <- do.call(dev_env$env[["susie"]], inject_em_null_check(init_args)) ref_init <- do.call(ref_env$env[["susie"]], inject_em_null_check(init_args)) dev_args <- list(X = X, y = y, L = 8, model_init = dev_init, estimate_prior_variance = FALSE, estimate_residual_variance = FALSE, residual_variance = 1.0, estimate_prior_method = "simple") ref_args <- list(X = X, y = y, L = 8, s_init = ref_init, estimate_prior_variance = FALSE, estimate_residual_variance = FALSE, residual_variance = 1.0, estimate_prior_method = "simple") dev_result <- suppressMessages(do.call(dev_env$env[["susie"]], inject_em_null_check(dev_args))) ref_result <- suppressMessages(do.call(ref_env$env[["susie"]], inject_em_null_check(ref_args))) expect_equal_susie_objects(dev_result, ref_result, tolerance = 1e-5) }) # L expansion with standardize=FALSE test_that("susie() matches reference with model_init, L expansion, standardize=FALSE - optim", { skip_if_no_reference() ref_env <- load_reference_env() dev_env <- load_development_env() set.seed(32) n <- 100 p <- 50 X <- matrix(rnorm(n * p), n, p) beta <- rep(0, p) beta[1:4] <- c(2, 3, -2, 1.5) y <- as.vector(X %*% beta + rnorm(n)) init_args <- list(X = X, y = y, L = 3, max_iter = 3, standardize = FALSE, estimate_prior_method = "optim") dev_init <- do.call(dev_env$env[["susie"]], inject_em_null_check(init_args)) ref_init <- do.call(ref_env$env[["susie"]], inject_em_null_check(init_args)) dev_args <- list(X = X, y = y, L = 10, model_init = dev_init, standardize = 
FALSE, estimate_prior_method = "optim") ref_args <- list(X = X, y = y, L = 10, s_init = ref_init, standardize = FALSE, estimate_prior_method = "optim") dev_result <- suppressMessages(do.call(dev_env$env[["susie"]], inject_em_null_check(dev_args))) ref_result <- suppressMessages(do.call(ref_env$env[["susie"]], inject_em_null_check(ref_args))) expect_equal_susie_objects(dev_result, ref_result, tolerance = 1e-5) }) test_that("susie() matches reference with model_init, L expansion, standardize=FALSE - simple", { skip_if_no_reference() ref_env <- load_reference_env() dev_env <- load_development_env() set.seed(32) n <- 100 p <- 50 X <- matrix(rnorm(n * p), n, p) beta <- rep(0, p) beta[1:4] <- c(2, 3, -2, 1.5) y <- as.vector(X %*% beta + rnorm(n)) init_args <- list(X = X, y = y, L = 3, max_iter = 3, standardize = FALSE, estimate_prior_method = "simple") dev_init <- do.call(dev_env$env[["susie"]], inject_em_null_check(init_args)) ref_init <- do.call(ref_env$env[["susie"]], inject_em_null_check(init_args)) dev_args <- list(X = X, y = y, L = 10, model_init = dev_init, standardize = FALSE, estimate_prior_method = "simple") ref_args <- list(X = X, y = y, L = 10, s_init = ref_init, standardize = FALSE, estimate_prior_method = "simple") dev_result <- suppressMessages(do.call(dev_env$env[["susie"]], inject_em_null_check(dev_args))) ref_result <- suppressMessages(do.call(ref_env$env[["susie"]], inject_em_null_check(ref_args))) expect_equal_susie_objects(dev_result, ref_result, tolerance = 1e-5) }) # L expansion with intercept=FALSE test_that("susie() matches reference with model_init, L expansion, intercept=FALSE - optim", { skip_if_no_reference() ref_env <- load_reference_env() dev_env <- load_development_env() set.seed(33) n <- 100 p <- 50 X <- matrix(rnorm(n * p), n, p) beta <- rep(0, p) beta[1:4] <- c(2, 3, -2, 1.5) y <- as.vector(X %*% beta + rnorm(n)) init_args <- list(X = X, y = y, L = 3, max_iter = 3, intercept = FALSE, estimate_prior_method = "optim") dev_init <- 
do.call(dev_env$env[["susie"]], inject_em_null_check(init_args)) ref_init <- do.call(ref_env$env[["susie"]], inject_em_null_check(init_args)) dev_args <- list(X = X, y = y, L = 10, model_init = dev_init, intercept = FALSE, estimate_prior_method = "optim") ref_args <- list(X = X, y = y, L = 10, s_init = ref_init, intercept = FALSE, estimate_prior_method = "optim") dev_result <- suppressMessages(do.call(dev_env$env[["susie"]], inject_em_null_check(dev_args))) ref_result <- suppressMessages(do.call(ref_env$env[["susie"]], inject_em_null_check(ref_args))) expect_equal_susie_objects(dev_result, ref_result, tolerance = 1e-5) }) test_that("susie() matches reference with model_init, L expansion, intercept=FALSE - simple", { skip_if_no_reference() ref_env <- load_reference_env() dev_env <- load_development_env() set.seed(33) n <- 100 p <- 50 X <- matrix(rnorm(n * p), n, p) beta <- rep(0, p) beta[1:4] <- c(2, 3, -2, 1.5) y <- as.vector(X %*% beta + rnorm(n)) init_args <- list(X = X, y = y, L = 3, max_iter = 3, intercept = FALSE, estimate_prior_method = "simple") dev_init <- do.call(dev_env$env[["susie"]], inject_em_null_check(init_args)) ref_init <- do.call(ref_env$env[["susie"]], inject_em_null_check(init_args)) dev_args <- list(X = X, y = y, L = 10, model_init = dev_init, intercept = FALSE, estimate_prior_method = "simple") ref_args <- list(X = X, y = y, L = 10, s_init = ref_init, intercept = FALSE, estimate_prior_method = "simple") dev_result <- suppressMessages(do.call(dev_env$env[["susie"]], inject_em_null_check(dev_args))) ref_result <- suppressMessages(do.call(ref_env$env[["susie"]], inject_em_null_check(ref_args))) expect_equal_susie_objects(dev_result, ref_result, tolerance = 1e-5) }) # L expansion with non-default scaled_prior_variance test_that("susie() matches reference with model_init, L expansion, scaled_prior_variance=0.5 - optim", { skip_if_no_reference() ref_env <- load_reference_env() dev_env <- load_development_env() set.seed(34) n <- 100 p <- 50 X <- 
matrix(rnorm(n * p), n, p) beta <- rep(0, p) beta[1:4] <- c(2, 3, -2, 1.5) y <- as.vector(X %*% beta + rnorm(n)) init_args <- list(X = X, y = y, L = 3, max_iter = 3, scaled_prior_variance = 0.5, estimate_prior_method = "optim") dev_init <- do.call(dev_env$env[["susie"]], inject_em_null_check(init_args)) ref_init <- do.call(ref_env$env[["susie"]], inject_em_null_check(init_args)) dev_args <- list(X = X, y = y, L = 10, model_init = dev_init, scaled_prior_variance = 0.5, estimate_prior_method = "optim") ref_args <- list(X = X, y = y, L = 10, s_init = ref_init, scaled_prior_variance = 0.5, estimate_prior_method = "optim") dev_result <- suppressMessages(do.call(dev_env$env[["susie"]], inject_em_null_check(dev_args))) ref_result <- suppressMessages(do.call(ref_env$env[["susie"]], inject_em_null_check(ref_args))) expect_equal_susie_objects(dev_result, ref_result, tolerance = 1e-5) }) # ============================================================================= # Part 18: model_init with L contraction (model_init has more effects than L) # ============================================================================= test_that("susie() matches reference with model_init, L contraction - optim", { skip_if_no_reference() ref_env <- load_reference_env() dev_env <- load_development_env() set.seed(35) n <- 100 p <- 50 X <- matrix(rnorm(n * p), n, p) beta <- rep(0, p) beta[1:4] <- c(2, 3, -2, 1.5) y <- as.vector(X %*% beta + rnorm(n)) # Initial fit with L=10 init_args <- list(X = X, y = y, L = 10, max_iter = 5, estimate_prior_method = "optim") dev_init <- do.call(dev_env$env[["susie"]], inject_em_null_check(init_args)) ref_init <- do.call(ref_env$env[["susie"]], inject_em_null_check(init_args)) # Second fit with L=5 (contraction - model_init has more effects) dev_args <- list(X = X, y = y, L = 5, model_init = dev_init, estimate_prior_method = "optim") ref_args <- list(X = X, y = y, L = 5, s_init = ref_init, estimate_prior_method = "optim") dev_result <- 
suppressWarnings(suppressMessages(do.call(dev_env$env[["susie"]],
                                            inject_em_null_check(dev_args))))
  ref_result <- suppressWarnings(suppressMessages(
    do.call(ref_env$env[["susie"]], inject_em_null_check(ref_args))))
  expect_equal_susie_objects(dev_result, ref_result, tolerance = 1e-5)
})

# Shared simulation for the model_init tests below: n = 100 samples, p = 50
# predictors, four causal effects on the first four columns.  set.seed() is
# called inside, and the RNG draws happen in the same order as the original
# inline code, so every test sees byte-identical data.
sim_xy <- function(seed) {
  set.seed(seed)
  n <- 100
  p <- 50
  X <- matrix(rnorm(n * p), n, p)
  beta <- rep(0, p)
  beta[1:4] <- c(2, 3, -2, 1.5)
  y <- as.vector(X %*% beta + rnorm(n))
  list(X = X, y = y, p = p)
}

test_that("susie() matches reference with model_init, L contraction - simple", {
  skip_if_no_reference()
  ref_env <- load_reference_env()
  dev_env <- load_development_env()
  dat <- sim_xy(35)
  init_args <- list(X = dat$X, y = dat$y, L = 10, max_iter = 5,
                    estimate_prior_method = "simple")
  dev_init <- do.call(dev_env$env[["susie"]], inject_em_null_check(init_args))
  ref_init <- do.call(ref_env$env[["susie"]], inject_em_null_check(init_args))
  dev_args <- list(X = dat$X, y = dat$y, L = 5, model_init = dev_init,
                   estimate_prior_method = "simple")
  ref_args <- list(X = dat$X, y = dat$y, L = 5, s_init = ref_init,
                   estimate_prior_method = "simple")
  dev_result <- suppressWarnings(suppressMessages(
    do.call(dev_env$env[["susie"]], inject_em_null_check(dev_args))))
  ref_result <- suppressWarnings(suppressMessages(
    do.call(ref_env$env[["susie"]], inject_em_null_check(ref_args))))
  expect_equal_susie_objects(dev_result, ref_result, tolerance = 1e-5)
})

# =============================================================================
# Part 19: model_init with susie_init_coef
# =============================================================================

test_that("susie() matches reference with susie_init_coef as model_init - optim", {
  skip_if_no_reference()
  ref_env <- load_reference_env()
  dev_env <- load_development_env()
  dat <- sim_xy(36)
  # Create init from known coefficients
  dev_coef_init <- dev_env$env[["susie_init_coef"]](1:4, c(2, 3, -2, 1.5), dat$p)
  ref_coef_init <- ref_env$env[["susie_init_coef"]](1:4, c(2, 3, -2, 1.5), dat$p)
  dev_args <- list(X = dat$X, y = dat$y, L = 10, model_init = dev_coef_init,
                   estimate_prior_method = "optim")
  ref_args <- list(X = dat$X, y = dat$y, L = 10, s_init = ref_coef_init,
                   estimate_prior_method = "optim")
  dev_result <- suppressMessages(
    do.call(dev_env$env[["susie"]], inject_em_null_check(dev_args)))
  ref_result <- suppressMessages(
    do.call(ref_env$env[["susie"]], inject_em_null_check(ref_args)))
  expect_equal_susie_objects(dev_result, ref_result, tolerance = 1e-5)
})

test_that("susie() matches reference with susie_init_coef as model_init - simple", {
  skip_if_no_reference()
  ref_env <- load_reference_env()
  dev_env <- load_development_env()
  dat <- sim_xy(36)
  dev_coef_init <- dev_env$env[["susie_init_coef"]](1:4, c(2, 3, -2, 1.5), dat$p)
  ref_coef_init <- ref_env$env[["susie_init_coef"]](1:4, c(2, 3, -2, 1.5), dat$p)
  dev_args <- list(X = dat$X, y = dat$y, L = 10, model_init = dev_coef_init,
                   estimate_prior_method = "simple")
  ref_args <- list(X = dat$X, y = dat$y, L = 10, s_init = ref_coef_init,
                   estimate_prior_method = "simple")
  dev_result <- suppressMessages(
    do.call(dev_env$env[["susie"]], inject_em_null_check(dev_args)))
  ref_result <- suppressMessages(
    do.call(ref_env$env[["susie"]], inject_em_null_check(ref_args)))
  expect_equal_susie_objects(dev_result, ref_result, tolerance = 1e-5)
})

# susie_init_coef with same L (no expansion)
test_that("susie() matches reference with susie_init_coef as model_init, matching L - optim", {
  skip_if_no_reference()
  ref_env <- load_reference_env()
  dev_env <- load_development_env()
  dat <- sim_xy(37)
  dev_coef_init <- dev_env$env[["susie_init_coef"]](1:4, c(2, 3, -2, 1.5), dat$p)
  ref_coef_init <- ref_env$env[["susie_init_coef"]](1:4, c(2, 3, -2, 1.5), dat$p)
  dev_args <- list(X = dat$X, y = dat$y, L = 4, model_init = dev_coef_init,
                   estimate_prior_method = "optim")
  ref_args <- list(X = dat$X, y = dat$y, L = 4, s_init = ref_coef_init,
                   estimate_prior_method = "optim")
  dev_result <- do.call(dev_env$env[["susie"]], inject_em_null_check(dev_args))
  ref_result <- do.call(ref_env$env[["susie"]], inject_em_null_check(ref_args))
  expect_equal_susie_objects(dev_result, ref_result, tolerance = 1e-5)
})

# =============================================================================
# Part 20: model_init with null_weight
# =============================================================================

test_that("susie() matches reference with model_init and null_weight - optim", {
  skip("Bug fix: susieR1.0 incorrectly set lpo=0 for infinite shat2 (null column), ignoring the actual null_weight. susieR2.0 correctly uses log(prior_weights).")
  skip_if_no_reference()
  ref_env <- load_reference_env()
  dev_env <- load_development_env()
  dat <- sim_xy(38)
  init_args <- list(X = dat$X, y = dat$y, L = 5, max_iter = 3,
                    null_weight = 0.5, estimate_prior_method = "optim")
  dev_init <- do.call(dev_env$env[["susie"]], inject_em_null_check(init_args))
  ref_init <- do.call(ref_env$env[["susie"]], inject_em_null_check(init_args))
  dev_args <- list(X = dat$X, y = dat$y, L = 5, model_init = dev_init,
                   null_weight = 0.5, estimate_prior_method = "optim")
  ref_args <- list(X = dat$X, y = dat$y, L = 5, s_init = ref_init,
                   null_weight = 0.5, estimate_prior_method = "optim")
  dev_result <- do.call(dev_env$env[["susie"]], inject_em_null_check(dev_args))
  ref_result <- do.call(ref_env$env[["susie"]], inject_em_null_check(ref_args))
  expect_equal_susie_objects(dev_result, ref_result, tolerance = 1e-5)
})

test_that("susie() matches reference with model_init and null_weight - simple", {
  skip("Bug fix: susieR1.0 incorrectly set lpo=0 for infinite shat2 (null column), ignoring the actual null_weight. susieR2.0 correctly uses log(prior_weights).")
  skip_if_no_reference()
  ref_env <- load_reference_env()
  dev_env <- load_development_env()
  dat <- sim_xy(38)
  init_args <- list(X = dat$X, y = dat$y, L = 5, max_iter = 3,
                    null_weight = 0.5, estimate_prior_method = "simple")
  dev_init <- do.call(dev_env$env[["susie"]], inject_em_null_check(init_args))
  ref_init <- do.call(ref_env$env[["susie"]], inject_em_null_check(init_args))
  dev_args <- list(X = dat$X, y = dat$y, L = 5, model_init = dev_init,
                   null_weight = 0.5, estimate_prior_method = "simple")
  ref_args <- list(X = dat$X, y = dat$y, L = 5, s_init = ref_init,
                   null_weight = 0.5, estimate_prior_method = "simple")
  dev_result <- do.call(dev_env$env[["susie"]], inject_em_null_check(dev_args))
  ref_result <- do.call(ref_env$env[["susie"]], inject_em_null_check(ref_args))
  expect_equal_susie_objects(dev_result, ref_result, tolerance = 1e-5)
})

# =============================================================================
# Part 21: model_init with prior_weights
# =============================================================================

test_that("susie() matches reference with model_init and prior_weights - optim", {
  skip_if_no_reference()
  ref_env <- load_reference_env()
  dev_env <- load_development_env()
  dat <- sim_xy(39)
  # Non-uniform prior weights (drawn after sim_xy so RNG order is unchanged)
  pw <- runif(dat$p)
  pw <- pw / sum(pw)
  init_args <- list(X = dat$X, y = dat$y, L = 5, max_iter = 3,
                    prior_weights = pw, estimate_prior_method = "optim")
  dev_init <- do.call(dev_env$env[["susie"]], inject_em_null_check(init_args))
  ref_init <- do.call(ref_env$env[["susie"]], inject_em_null_check(init_args))
  dev_args <- list(X = dat$X, y = dat$y, L = 5, model_init = dev_init,
                   prior_weights = pw, estimate_prior_method = "optim")
  ref_args <- list(X = dat$X, y = dat$y, L = 5, s_init = ref_init,
                   prior_weights = pw, estimate_prior_method = "optim")
  dev_result <- do.call(dev_env$env[["susie"]], inject_em_null_check(dev_args))
  ref_result <- do.call(ref_env$env[["susie"]], inject_em_null_check(ref_args))
  expect_equal_susie_objects(dev_result, ref_result, tolerance = 1e-5)
})

test_that("susie() matches reference with model_init and prior_weights - simple", {
  skip_if_no_reference()
  ref_env <- load_reference_env()
  dev_env <- load_development_env()
  dat <- sim_xy(39)
  pw <- runif(dat$p)
  pw <- pw / sum(pw)
  init_args <- list(X = dat$X, y = dat$y, L = 5, max_iter = 3,
                    prior_weights = pw, estimate_prior_method = "simple")
  dev_init <- do.call(dev_env$env[["susie"]], inject_em_null_check(init_args))
  ref_init <- do.call(ref_env$env[["susie"]], inject_em_null_check(init_args))
  dev_args <- list(X = dat$X, y = dat$y, L = 5, model_init = dev_init,
                   prior_weights = pw, estimate_prior_method = "simple")
  ref_args <- list(X = dat$X, y = dat$y, L = 5, s_init = ref_init,
                   prior_weights = pw, estimate_prior_method = "simple")
  dev_result <- do.call(dev_env$env[["susie"]], inject_em_null_check(dev_args))
  ref_result <- do.call(ref_env$env[["susie"]], inject_em_null_check(ref_args))
  expect_equal_susie_objects(dev_result, ref_result, tolerance = 1e-5)
})

# L expansion with prior_weights
test_that("susie() matches reference with model_init, L expansion, and prior_weights - optim", {
  skip_if_no_reference()
  ref_env <- load_reference_env()
  dev_env <- load_development_env()
  dat <- sim_xy(40)
  pw <- runif(dat$p)
  pw <- pw / sum(pw)
  init_args <- list(X = dat$X, y = dat$y, L = 3, max_iter = 3,
                    prior_weights = pw, estimate_prior_method = "optim")
  dev_init <- do.call(dev_env$env[["susie"]], inject_em_null_check(init_args))
  ref_init <- do.call(ref_env$env[["susie"]], inject_em_null_check(init_args))
  dev_args <- list(X = dat$X, y = dat$y, L = 8, model_init = dev_init,
                   prior_weights = pw, estimate_prior_method = "optim")
  ref_args <- list(X = dat$X, y = dat$y, L = 8, s_init = ref_init,
                   prior_weights = pw, estimate_prior_method = "optim")
  dev_result <- suppressMessages(
    do.call(dev_env$env[["susie"]], inject_em_null_check(dev_args)))
  ref_result <- suppressMessages(
    do.call(ref_env$env[["susie"]], inject_em_null_check(ref_args)))
  expect_equal_susie_objects(dev_result, ref_result, tolerance = 1e-5)
})

# =============================================================================
# Part 22: model_init with max_iter=1 (single iteration - check initialization)
# =============================================================================
# Running with max_iter=1 ensures we're testing the initialization path itself,
# not just the converged output.

test_that("susie() matches reference with model_init, max_iter=1 - optim", {
  skip_if_no_reference()
  ref_env <- load_reference_env()
  dev_env <- load_development_env()
  dat <- sim_xy(41)
  init_args <- list(X = dat$X, y = dat$y, L = 5, max_iter = 3,
                    estimate_prior_method = "optim")
  dev_init <- do.call(dev_env$env[["susie"]], inject_em_null_check(init_args))
  ref_init <- do.call(ref_env$env[["susie"]], inject_em_null_check(init_args))
  dev_args <- list(X = dat$X, y = dat$y, L = 5, model_init = dev_init,
                   max_iter = 1, estimate_prior_method = "optim")
  ref_args <- list(X = dat$X, y = dat$y, L = 5, s_init = ref_init,
                   max_iter = 1, estimate_prior_method = "optim")
  dev_result <- do.call(dev_env$env[["susie"]], inject_em_null_check(dev_args))
  ref_result <- do.call(ref_env$env[["susie"]], inject_em_null_check(ref_args))
  expect_equal_susie_objects(dev_result, ref_result, tolerance = 1e-5)
})

test_that("susie() matches reference with model_init, max_iter=1 - simple", {
  skip_if_no_reference()
  ref_env <- load_reference_env()
  dev_env <- load_development_env()
  dat <- sim_xy(41)
  init_args <- list(X = dat$X, y = dat$y, L = 5, max_iter = 3,
                    estimate_prior_method = "simple")
  dev_init <- do.call(dev_env$env[["susie"]], inject_em_null_check(init_args))
  ref_init <- do.call(ref_env$env[["susie"]], inject_em_null_check(init_args))
  dev_args <- list(X = dat$X, y = dat$y, L = 5, model_init = dev_init,
                   max_iter = 1, estimate_prior_method = "simple")
  ref_args <- list(X = dat$X, y = dat$y, L = 5, s_init = ref_init,
                   max_iter = 1, estimate_prior_method = "simple")
  dev_result <- do.call(dev_env$env[["susie"]], inject_em_null_check(dev_args))
  ref_result <- do.call(ref_env$env[["susie"]], inject_em_null_check(ref_args))
  expect_equal_susie_objects(dev_result, ref_result, tolerance = 1e-5)
})

# L expansion with max_iter=1
test_that("susie() matches reference with model_init, L expansion, max_iter=1 - optim", {
  skip_if_no_reference()
  ref_env <- load_reference_env()
  dev_env <- load_development_env()
  dat <- sim_xy(42)
  init_args <- list(X = dat$X, y = dat$y, L = 3, max_iter = 3,
                    estimate_prior_method = "optim")
  dev_init <- do.call(dev_env$env[["susie"]], inject_em_null_check(init_args))
  ref_init <- do.call(ref_env$env[["susie"]], inject_em_null_check(init_args))
  dev_args <- list(X = dat$X, y = dat$y, L = 8, model_init = dev_init,
                   max_iter = 1, estimate_prior_method = "optim")
  ref_args <- list(X = dat$X, y = dat$y, L = 8, s_init = ref_init,
                   max_iter = 1, estimate_prior_method = "optim")
  dev_result <- suppressMessages(
    do.call(dev_env$env[["susie"]], inject_em_null_check(dev_args)))
  ref_result <- suppressMessages(
    do.call(ref_env$env[["susie"]], inject_em_null_check(ref_args)))
  expect_equal_susie_objects(dev_result, ref_result, tolerance = 1e-5)
})

test_that("susie() matches reference with model_init, L expansion, max_iter=1 - simple", {
  skip_if_no_reference()
  ref_env <- load_reference_env()
  dev_env <- load_development_env()
  dat <- sim_xy(42)
  init_args <- list(X = dat$X, y = dat$y, L = 3, max_iter = 3,
                    estimate_prior_method = "simple")
  dev_init <- do.call(dev_env$env[["susie"]], inject_em_null_check(init_args))
  ref_init <- do.call(ref_env$env[["susie"]], inject_em_null_check(init_args))
  dev_args <- list(X = dat$X, y = dat$y, L = 8, model_init = dev_init,
                   max_iter = 1, estimate_prior_method = "simple")
  ref_args <- list(X = dat$X, y = dat$y, L = 8, s_init = ref_init,
                   max_iter = 1, estimate_prior_method = "simple")
  dev_result <- suppressMessages(
    do.call(dev_env$env[["susie"]], inject_em_null_check(dev_args)))
  ref_result <- suppressMessages(
    do.call(ref_env$env[["susie"]], inject_em_null_check(ref_args)))
  expect_equal_susie_objects(dev_result, ref_result, tolerance = 1e-5)
})

================================================
FILE: tests/testthat/reference/test_susie_rss_lambda_reference.R
================================================

# Source helper functions
source(file.path("..", "helper_reference.R"), local = TRUE)

context("susie_rss with lambda reference comparison")

# =============================================================================
# REFERENCE TESTS FOR susie_rss_lambda() with lambda > 0
# =============================================================================
#
# These tests compare susie_rss_lambda(lambda > 0) against the historical
# susie_rss(lambda > 0) implementation from stephenslab/susieR@1f9166c.
#
# =============================================================================
# Part 1: Different lambda values
# =============================================================================

# Shared simulation for these tests: n = 500 samples, p = 50 predictors,
# three causal effects.  Computes the z-scores and symmetrized LD matrix the
# same way in every test; set.seed() is called inside, and the RNG draws
# happen in the same order as the original inline code, so any runif() calls
# made afterwards by a test see the same RNG state as before.
sim_rss <- function(seed) {
  set.seed(seed)
  n <- 500
  p <- 50
  X <- matrix(rnorm(n * p), n, p)
  beta <- rep(0, p)
  beta[c(5, 10, 20)] <- c(0.5, 0.4, 0.3)
  y <- as.vector(X %*% beta + rnorm(n))
  input_ss <- compute_suff_stat(X, y, standardize = TRUE)
  ss <- univariate_regression(X, y)
  R <- with(input_ss, cov2cor(XtX))
  R <- (R + t(R)) / 2
  z <- with(ss, betahat / sebetahat)
  list(z = z, R = R, p = p)
}

test_that("susie_rss_lambda() matches reference with lambda=1e-5 - optim", {
  skip_if_no_reference()
  dat <- sim_rss(1)
  args <- list(z = dat$z, R = dat$R, L = 10, lambda = 1e-5,
               estimate_prior_method = "optim",
               estimate_residual_variance = TRUE)
  compare_to_reference("susie_rss_lambda", args, tolerance = 1e-5,
                       ref_func_name = "susie_rss")
})

test_that("susie_rss_lambda() matches reference with lambda=1e-5 - EM", {
  skip_if_no_reference()
  dat <- sim_rss(1)
  args <- list(z = dat$z, R = dat$R, L = 10, lambda = 1e-5,
               estimate_prior_method = "EM",
               estimate_residual_variance = TRUE)
  compare_to_reference("susie_rss_lambda", args, tolerance = 1e-5,
                       ref_func_name = "susie_rss")
})

test_that("susie_rss_lambda() matches reference with lambda=1e-5 - simple", {
  skip_if_no_reference()
  dat <- sim_rss(1)
  args <- list(z = dat$z, R = dat$R, L = 10, lambda = 1e-5,
               estimate_prior_method = "simple",
               estimate_residual_variance = TRUE)
  compare_to_reference("susie_rss_lambda", args, tolerance = 1e-5,
                       ref_func_name = "susie_rss")
})

test_that("susie_rss_lambda() matches reference with lambda=0.1 - optim", {
  skip_if_no_reference()
  dat <- sim_rss(2)
  args <- list(z = dat$z, R = dat$R, L = 10, lambda = 0.1,
               estimate_prior_method = "optim",
               estimate_residual_variance = TRUE)
  compare_to_reference("susie_rss_lambda", args, tolerance = 1e-5,
                       ref_func_name = "susie_rss")
})

test_that("susie_rss_lambda() matches reference with lambda=0.1 - EM", {
  skip_if_no_reference()
  dat <- sim_rss(2)
  args <- list(z = dat$z, R = dat$R, L = 10, lambda = 0.1,
               estimate_prior_method = "EM",
               estimate_residual_variance = TRUE)
  compare_to_reference("susie_rss_lambda", args, tolerance = 1e-5,
                       ref_func_name = "susie_rss")
})

test_that("susie_rss_lambda() matches reference with lambda=0.1 - simple", {
  skip_if_no_reference()
  dat <- sim_rss(2)
  args <- list(z = dat$z, R = dat$R, L = 10, lambda = 0.1,
               estimate_prior_method = "simple",
               estimate_residual_variance = TRUE)
  compare_to_reference("susie_rss_lambda", args, tolerance = 1e-5,
                       ref_func_name = "susie_rss")
})

test_that("susie_rss_lambda() matches reference with lambda=0.5 - optim", {
  skip_if_no_reference()
  dat <- sim_rss(3)
  args <- list(z = dat$z, R = dat$R, L = 10, lambda = 0.5,
               estimate_prior_method = "optim",
               estimate_residual_variance = TRUE)
  compare_to_reference("susie_rss_lambda", args, tolerance = 1e-5,
                       ref_func_name = "susie_rss")
})

test_that("susie_rss_lambda() matches reference with lambda=0.5 - EM", {
  skip_if_no_reference()
  dat <- sim_rss(3)
  args <- list(z = dat$z, R = dat$R, L = 10, lambda = 0.5,
               estimate_prior_method = "EM",
               estimate_residual_variance = TRUE)
  compare_to_reference("susie_rss_lambda", args, tolerance = 1e-5,
                       ref_func_name = "susie_rss")
})

test_that("susie_rss_lambda() matches reference with lambda=0.5 - simple", {
  skip_if_no_reference()
  dat <- sim_rss(3)
  args <- list(z = dat$z, R = dat$R, L = 10, lambda = 0.5,
               estimate_prior_method = "simple",
               estimate_residual_variance = TRUE)
  compare_to_reference("susie_rss_lambda", args, tolerance = 1e-5,
                       ref_func_name = "susie_rss")
})

# =============================================================================
# Part 2: Different L values
# =============================================================================

test_that("susie_rss_lambda() matches reference with different L values - optim", {
  skip_if_no_reference()
  dat <- sim_rss(4)
  # Same three comparisons (L = 1, 5, 20) as before, in the same order.
  for (L in c(1, 5, 20)) {
    args <- list(z = dat$z, R = dat$R, L = L, lambda = 1e-5,
                 estimate_prior_method = "optim",
                 estimate_residual_variance = TRUE)
    compare_to_reference("susie_rss_lambda", args, tolerance = 1e-5,
                         ref_func_name = "susie_rss")
  }
})

test_that("susie_rss_lambda() matches reference with different L values - EM", {
  skip_if_no_reference()
  dat <- sim_rss(4)
  for (L in c(1, 5, 20)) {
    args <- list(z = dat$z, R = dat$R, L = L, lambda = 1e-5,
                 estimate_prior_method = "EM",
                 estimate_residual_variance = TRUE)
    compare_to_reference("susie_rss_lambda", args, tolerance = 1e-5,
                         ref_func_name = "susie_rss")
  }
})

test_that("susie_rss_lambda() matches reference with different L values - simple", {
  skip_if_no_reference()
  dat <- sim_rss(4)
  for (L in c(1, 5, 20)) {
    args <- list(z = dat$z, R = dat$R, L = L, lambda = 1e-5,
                 estimate_prior_method = "simple",
                 estimate_residual_variance = TRUE)
    compare_to_reference("susie_rss_lambda", args, tolerance = 1e-5,
                         ref_func_name = "susie_rss")
  }
})

# =============================================================================
# Part 3: estimate_prior_variance parameter
# =============================================================================

test_that("susie_rss_lambda() matches reference with estimate_prior_variance=FALSE - optim", {
  skip_if_no_reference()
  dat <- sim_rss(5)
  args <- list(z = dat$z, R = dat$R, L = 10, lambda = 1e-5,
               estimate_prior_variance = FALSE,
               estimate_residual_variance = TRUE,
               estimate_prior_method = "optim")
  compare_to_reference("susie_rss_lambda", args, tolerance = 1e-5,
                       ref_func_name = "susie_rss")
})

test_that("susie_rss_lambda() matches reference with estimate_prior_variance=FALSE - EM", {
  skip_if_no_reference()
  dat <- sim_rss(5)
  args <- list(z = dat$z, R = dat$R, L = 10, lambda = 1e-5,
               estimate_prior_variance = FALSE,
               estimate_residual_variance = TRUE,
               estimate_prior_method = "EM")
  compare_to_reference("susie_rss_lambda", args, tolerance = 1e-5,
                       ref_func_name = "susie_rss")
})

test_that("susie_rss_lambda() matches reference with estimate_prior_variance=FALSE - simple", {
  skip_if_no_reference()
  dat <- sim_rss(5)
  args <- list(z = dat$z, R = dat$R, L = 10, lambda = 1e-5,
               estimate_prior_variance = FALSE,
               estimate_residual_variance = TRUE,
               estimate_prior_method = "simple")
  compare_to_reference("susie_rss_lambda", args, tolerance = 1e-5,
                       ref_func_name = "susie_rss")
})

# =============================================================================
# Part 4: estimate_residual_variance parameter
# =============================================================================

test_that("susie_rss_lambda() matches reference with estimate_residual_variance=FALSE - optim", {
  skip_if_no_reference()
  dat <- sim_rss(6)
  args <- list(z = dat$z, R = dat$R, L = 10, lambda = 1e-5,
               estimate_residual_variance = FALSE,
               estimate_prior_method = "optim")
  compare_to_reference("susie_rss_lambda", args, tolerance = 1e-5,
                       ref_func_name = "susie_rss")
})

test_that("susie_rss_lambda() matches reference with estimate_residual_variance=FALSE - EM", {
  skip_if_no_reference()
  dat <- sim_rss(6)
  args <- list(z = dat$z, R = dat$R, L = 10, lambda = 1e-5,
               estimate_residual_variance = FALSE,
               estimate_prior_method = "EM")
  compare_to_reference("susie_rss_lambda", args, tolerance = 1e-5,
                       ref_func_name = "susie_rss")
})

test_that("susie_rss_lambda() matches reference with estimate_residual_variance=FALSE - simple", {
  skip_if_no_reference()
  dat <- sim_rss(6)
  args <- list(z = dat$z, R = dat$R, L = 10, lambda = 1e-5,
               estimate_residual_variance = FALSE,
               estimate_prior_method = "simple")
  compare_to_reference("susie_rss_lambda", args, tolerance = 1e-5,
                       ref_func_name = "susie_rss")
})

test_that("susie_rss_lambda() matches reference with residual_variance fixed - optim", {
  skip_if_no_reference()
  dat <- sim_rss(7)
  args <- list(z = dat$z, R = dat$R, L = 10, lambda = 1e-5,
               estimate_residual_variance = FALSE,
               residual_variance = 1.0,
               estimate_prior_method = "optim")
  compare_to_reference("susie_rss_lambda", args, tolerance = 1e-5,
                       ref_func_name = "susie_rss")
})

test_that("susie_rss_lambda() matches reference with residual_variance fixed - EM", {
  skip_if_no_reference()
  dat <- sim_rss(7)
  args <- list(z = dat$z, R = dat$R, L = 10, lambda = 1e-5,
               estimate_residual_variance = FALSE,
               residual_variance = 1.0,
               estimate_prior_method = "EM")
  compare_to_reference("susie_rss_lambda", args, tolerance = 1e-5,
                       ref_func_name = "susie_rss")
})

test_that("susie_rss_lambda() matches reference with residual_variance fixed - simple", {
  skip_if_no_reference()
  dat <- sim_rss(7)
  args <- list(z = dat$z, R = dat$R, L = 10, lambda = 1e-5,
               estimate_residual_variance = FALSE,
               residual_variance = 1.0,
               estimate_prior_method = "simple")
  compare_to_reference("susie_rss_lambda", args, tolerance = 1e-5,
                       ref_func_name = "susie_rss")
})

# =============================================================================
# Part 5: prior_variance parameter
# =============================================================================

test_that("susie_rss_lambda() matches reference with prior_variance=100 - optim", {
  skip_if_no_reference()
  dat <- sim_rss(8)
  args <- list(z = dat$z, R = dat$R, L = 10, lambda = 1e-5,
               prior_variance = 100,
               estimate_prior_method = "optim",
               estimate_residual_variance = TRUE)
  compare_to_reference("susie_rss_lambda", args, tolerance = 1e-5,
                       ref_func_name = "susie_rss")
})

test_that("susie_rss_lambda() matches reference with prior_variance=100 - EM", {
  skip_if_no_reference()
  dat <- sim_rss(8)
  args <- list(z = dat$z, R = dat$R, L = 10, lambda = 1e-5,
               prior_variance = 100,
               estimate_prior_method = "EM",
               estimate_residual_variance = TRUE)
  compare_to_reference("susie_rss_lambda", args, tolerance = 1e-5,
                       ref_func_name = "susie_rss")
})

test_that("susie_rss_lambda() matches reference with prior_variance=100 - simple", {
  skip_if_no_reference()
  dat <- sim_rss(8)
  args <- list(z = dat$z, R = dat$R, L = 10, lambda = 1e-5,
               prior_variance = 100,
               estimate_prior_method = "simple",
               estimate_residual_variance = TRUE)
  compare_to_reference("susie_rss_lambda", args, tolerance = 1e-5,
                       ref_func_name = "susie_rss")
})

# =============================================================================
# Part 6: prior_weights
# =============================================================================

test_that("susie_rss_lambda() matches reference with prior_weights - optim", {
  skip_if_no_reference()
  dat <- sim_rss(9)
  # Use non-uniform prior weights (drawn after sim_rss, same RNG state as before)
  prior_weights <- runif(dat$p)
  prior_weights <- prior_weights / sum(prior_weights)
  args <- list(z = dat$z, R = dat$R, L = 10, lambda = 1e-5,
               prior_weights = prior_weights,
               estimate_prior_method = "optim",
               estimate_residual_variance = TRUE)
  compare_to_reference("susie_rss_lambda", args, tolerance = 1e-5,
                       ref_func_name = "susie_rss")
})

test_that("susie_rss_lambda() matches reference with prior_weights - EM", {
  skip_if_no_reference()
  dat <- sim_rss(9)
  # Use non-uniform prior weights
  prior_weights <- runif(dat$p)
  prior_weights <- prior_weights / sum(prior_weights)
  args <- list(z = dat$z, R = dat$R, L = 10, lambda = 1e-5,
               prior_weights = prior_weights,
               estimate_prior_method = "EM",
               estimate_residual_variance = TRUE)
  compare_to_reference("susie_rss_lambda", args, tolerance = 1e-5,
                       ref_func_name = "susie_rss")
})

test_that("susie_rss_lambda() matches reference with prior_weights - simple", {
  skip_if_no_reference()
  dat <- sim_rss(9)
  # Use non-uniform prior weights
  prior_weights <- runif(dat$p)
  prior_weights <- prior_weights / sum(prior_weights)
  args <- list(z = dat$z, R = dat$R, L = 10, lambda = 1e-5,
               prior_weights = prior_weights,
               estimate_prior_method = "simple",
               estimate_residual_variance = TRUE)
  compare_to_reference("susie_rss_lambda", args, tolerance = 1e-5,
                       ref_func_name = "susie_rss")
})

# =============================================================================
# Part 7: maf filtering
# =============================================================================

test_that("susie_rss_lambda() matches reference with maf filtering - optim", {
  skip_if_no_reference()
  dat <- sim_rss(10)
  # Simulate minor allele frequencies
  maf <- runif(dat$p, 0.05, 0.5)
  args <- list(z = dat$z, R = dat$R, L = 10, lambda = 1e-5,
               maf = maf, maf_thresh = 0.1,
               estimate_prior_method = "optim",
               estimate_residual_variance = TRUE)
  compare_to_reference("susie_rss_lambda", args, tolerance = 1e-5,
                       ref_func_name = "susie_rss")
})

test_that("susie_rss_lambda() matches reference with maf filtering - EM", {
  skip_if_no_reference()
  dat <- sim_rss(10)
  # Simulate minor allele frequencies
  maf <- runif(dat$p, 0.05, 0.5)
  args <- list(z = dat$z, R = dat$R, L = 10, lambda = 1e-5,
               maf = maf, maf_thresh = 0.1,
               estimate_prior_method = "EM",
               estimate_residual_variance = TRUE)
  compare_to_reference("susie_rss_lambda", args, tolerance = 1e-5,
                       ref_func_name = "susie_rss")
})

test_that("susie_rss_lambda() matches reference with maf filtering - simple", {
  skip_if_no_reference()
  dat <- sim_rss(10)
  # Simulate minor allele frequencies
  maf <- runif(dat$p, 0.05, 0.5)
  args <- list(z = dat$z, R = dat$R, L = 10, lambda = 1e-5,
               maf = maf, maf_thresh = 0.1,
               estimate_prior_method = "simple",
               estimate_residual_variance = TRUE)
  compare_to_reference("susie_rss_lambda", args, tolerance = 1e-5,
                       ref_func_name = "susie_rss")
})

# =============================================================================
# Part 8: coverage and min_abs_corr
# =============================================================================

test_that("susie_rss_lambda() matches reference with coverage=0.99 - optim", {
  skip_if_no_reference()
  dat <- sim_rss(11)
  args <- list(z = dat$z, R = dat$R, L = 10, lambda = 1e-5,
               coverage = 0.99,
               estimate_prior_method = "optim",
               estimate_residual_variance = TRUE)
  compare_to_reference("susie_rss_lambda", args, tolerance = 1e-5,
                       ref_func_name = "susie_rss")
})

test_that("susie_rss_lambda() matches reference with coverage=0.99 - EM", {
  skip_if_no_reference()
  dat <- sim_rss(11)
  args <- list(z = dat$z, R = dat$R, L = 10, lambda = 1e-5,
               coverage = 0.99,
               estimate_prior_method = "EM",
               estimate_residual_variance = TRUE)
  compare_to_reference("susie_rss_lambda", args, tolerance = 1e-5,
                       ref_func_name = "susie_rss")
})

test_that("susie_rss_lambda() matches reference with coverage=0.99 - simple", {
  skip_if_no_reference()
  dat <- sim_rss(11)
  args <- list(z = dat$z, R = dat$R, L = 10, lambda = 1e-5,
               coverage = 0.99,
               estimate_prior_method = "simple",
               estimate_residual_variance = TRUE)
  compare_to_reference("susie_rss_lambda", args, tolerance = 1e-5,
                       ref_func_name = "susie_rss")
})

test_that("susie_rss_lambda() matches reference with min_abs_corr=0.7 - optim", {
  skip_if_no_reference()
  set.seed(12)
  n <- 500
  p <- 50
  X <- matrix(rnorm(n * p), n, p)
  beta <- rep(0, p)
  beta[c(5, 10, 20)] <- c(0.5, 0.4, 0.3)
  y <- as.vector(X %*% beta + rnorm(n))
  input_ss <- compute_suff_stat(X, y, standardize = TRUE)
  ss <- univariate_regression(X, y)
  R <-
with(input_ss, cov2cor(XtX)) R <- (R + t(R)) / 2 z <- with(ss, betahat / sebetahat) args <- list(z = z, R = R, L = 10, lambda = 1e-5, min_abs_corr = 0.7, estimate_prior_method = "optim", estimate_residual_variance = TRUE) compare_to_reference("susie_rss_lambda", args, tolerance = 1e-5, ref_func_name = "susie_rss") }) test_that("susie_rss_lambda() matches reference with min_abs_corr=0.7 - EM", { skip_if_no_reference() set.seed(12) n <- 500 p <- 50 X <- matrix(rnorm(n * p), n, p) beta <- rep(0, p) beta[c(5, 10, 20)] <- c(0.5, 0.4, 0.3) y <- as.vector(X %*% beta + rnorm(n)) input_ss <- compute_suff_stat(X, y, standardize = TRUE) ss <- univariate_regression(X, y) R <- with(input_ss, cov2cor(XtX)) R <- (R + t(R)) / 2 z <- with(ss, betahat / sebetahat) args <- list(z = z, R = R, L = 10, lambda = 1e-5, min_abs_corr = 0.7, estimate_prior_method = "EM", estimate_residual_variance = TRUE) compare_to_reference("susie_rss_lambda", args, tolerance = 1e-5, ref_func_name = "susie_rss") }) test_that("susie_rss_lambda() matches reference with min_abs_corr=0.7 - simple", { skip_if_no_reference() set.seed(12) n <- 500 p <- 50 X <- matrix(rnorm(n * p), n, p) beta <- rep(0, p) beta[c(5, 10, 20)] <- c(0.5, 0.4, 0.3) y <- as.vector(X %*% beta + rnorm(n)) input_ss <- compute_suff_stat(X, y, standardize = TRUE) ss <- univariate_regression(X, y) R <- with(input_ss, cov2cor(XtX)) R <- (R + t(R)) / 2 z <- with(ss, betahat / sebetahat) args <- list(z = z, R = R, L = 10, lambda = 1e-5, min_abs_corr = 0.7, estimate_prior_method = "simple", estimate_residual_variance = TRUE) compare_to_reference("susie_rss_lambda", args, tolerance = 1e-5, ref_func_name = "susie_rss") }) # ============================================================================= # Part 9: prior_tol parameter # ============================================================================= test_that("susie_rss_lambda() matches reference with prior_tol=1e-5 - optim", { skip_if_no_reference() set.seed(13) n <- 500 p <- 50 X <- 
matrix(rnorm(n * p), n, p) beta <- rep(0, p) beta[c(5, 10, 20)] <- c(0.5, 0.4, 0.3) y <- as.vector(X %*% beta + rnorm(n)) input_ss <- compute_suff_stat(X, y, standardize = TRUE) ss <- univariate_regression(X, y) R <- with(input_ss, cov2cor(XtX)) R <- (R + t(R)) / 2 z <- with(ss, betahat / sebetahat) # Disable check_null_threshold so we can see prior_tol effects args <- list( z = z, R = R, L = 10, lambda = 1e-5, prior_tol = 0.1, estimate_prior_method = "optim", estimate_residual_variance = TRUE ) compare_to_reference("susie_rss_lambda", args, tolerance = 1e-5, ref_func_name = "susie_rss") }) test_that("susie_rss_lambda() matches reference with prior_tol=1e-5 - EM", { skip_if_no_reference() set.seed(13) n <- 500 p <- 50 X <- matrix(rnorm(n * p), n, p) beta <- rep(0, p) beta[c(5, 10, 20)] <- c(0.5, 0.4, 0.3) y <- as.vector(X %*% beta + rnorm(n)) input_ss <- compute_suff_stat(X, y, standardize = TRUE) ss <- univariate_regression(X, y) R <- with(input_ss, cov2cor(XtX)) R <- (R + t(R)) / 2 z <- with(ss, betahat / sebetahat) args <- list( z = z, R = R, L = 10, lambda = 1e-5, prior_tol = 0.1, estimate_prior_method = "EM", estimate_residual_variance = TRUE ) compare_to_reference("susie_rss_lambda", args, tolerance = 1e-5, ref_func_name = "susie_rss") }) test_that("susie_rss_lambda() matches reference with prior_tol=1e-5 - simple", { skip_if_no_reference() set.seed(13) n <- 500 p <- 50 X <- matrix(rnorm(n * p), n, p) beta <- rep(0, p) beta[c(5, 10, 20)] <- c(0.5, 0.4, 0.3) y <- as.vector(X %*% beta + rnorm(n)) input_ss <- compute_suff_stat(X, y, standardize = TRUE) ss <- univariate_regression(X, y) R <- with(input_ss, cov2cor(XtX)) R <- (R + t(R)) / 2 z <- with(ss, betahat / sebetahat) args <- list( z = z, R = R, L = 10, lambda = 1e-5, prior_tol = 0.1, estimate_prior_method = "simple", estimate_residual_variance = TRUE ) compare_to_reference("susie_rss_lambda", args, tolerance = 1e-5, ref_func_name = "susie_rss") }) # 
============================================================================= # Part 10: check_null_threshold parameter # ============================================================================= test_that("susie_rss_lambda() matches reference with check_null_threshold=0.1 - optim", { skip_if_no_reference() set.seed(14) n <- 500 p <- 50 X <- matrix(rnorm(n * p), n, p) beta <- rep(0, p) beta[c(5, 10, 20)] <- c(0.5, 0.4, 0.3) y <- as.vector(X %*% beta + rnorm(n)) input_ss <- compute_suff_stat(X, y, standardize = TRUE) ss <- univariate_regression(X, y) R <- with(input_ss, cov2cor(XtX)) R <- (R + t(R)) / 2 z <- with(ss, betahat / sebetahat) args <- list( z = z, R = R, L = 10, lambda = 1e-5, check_null_threshold = 0.1, estimate_prior_method = "optim", estimate_residual_variance = TRUE ) compare_to_reference("susie_rss_lambda", args, tolerance = 1e-5, ref_func_name = "susie_rss") }) test_that("susie_rss_lambda() matches reference with check_null_threshold=0.1 - EM", { skip("Not a bug: susieR2.0 intentionally skips the check_null_threshold V-zeroing step for EM (see R/single_effect_regression.R:169 and stephenslab/mvsusieR#26). The check would zero V without recomputing the posterior, creating an inconsistent (q, V) pair that can decrease the ELBO. 
Since dev ignores check_null_threshold for EM, this test cannot match a reference that always applies the check.") skip_if_no_reference() set.seed(14) n <- 500 p <- 50 X <- matrix(rnorm(n * p), n, p) beta <- rep(0, p) beta[c(5, 10, 20)] <- c(0.5, 0.4, 0.3) y <- as.vector(X %*% beta + rnorm(n)) input_ss <- compute_suff_stat(X, y, standardize = TRUE) ss <- univariate_regression(X, y) R <- with(input_ss, cov2cor(XtX)) R <- (R + t(R)) / 2 z <- with(ss, betahat / sebetahat) args <- list( z = z, R = R, L = 10, lambda = 1e-5, check_null_threshold = 0.1, estimate_prior_method = "EM", estimate_residual_variance = TRUE ) compare_to_reference("susie_rss_lambda", args, tolerance = 1e-5, ref_func_name = "susie_rss") }) test_that("susie_rss_lambda() matches reference with check_null_threshold=0.1 - simple", { skip_if_no_reference() set.seed(14) n <- 500 p <- 50 X <- matrix(rnorm(n * p), n, p) beta <- rep(0, p) beta[c(5, 10, 20)] <- c(0.5, 0.4, 0.3) y <- as.vector(X %*% beta + rnorm(n)) input_ss <- compute_suff_stat(X, y, standardize = TRUE) ss <- univariate_regression(X, y) R <- with(input_ss, cov2cor(XtX)) R <- (R + t(R)) / 2 z <- with(ss, betahat / sebetahat) args <- list( z = z, R = R, L = 10, lambda = 1e-5, check_null_threshold = 0.1, estimate_prior_method = "simple", estimate_residual_variance = TRUE ) compare_to_reference("susie_rss_lambda", args, tolerance = 1e-5, ref_func_name = "susie_rss") }) # ============================================================================= # Part 11: intercept_value parameter # ============================================================================= test_that("susie_rss_lambda() matches reference with intercept_value=0.5 - optim", { skip_if_no_reference() set.seed(15) n <- 500 p <- 50 X <- matrix(rnorm(n * p), n, p) beta <- rep(0, p) beta[c(5, 10, 20)] <- c(0.5, 0.4, 0.3) y <- as.vector(X %*% beta + rnorm(n)) input_ss <- compute_suff_stat(X, y, standardize = TRUE) ss <- univariate_regression(X, y) R <- with(input_ss, cov2cor(XtX)) R 
<- (R + t(R)) / 2 z <- with(ss, betahat / sebetahat) args <- list(z = z, R = R, L = 10, lambda = 1e-5, intercept_value = 0.5, estimate_prior_method = "optim", estimate_residual_variance = TRUE) compare_to_reference("susie_rss_lambda", args, tolerance = 1e-5, ref_func_name = "susie_rss") }) test_that("susie_rss_lambda() matches reference with intercept_value=0.5 - EM", { skip_if_no_reference() set.seed(15) n <- 500 p <- 50 X <- matrix(rnorm(n * p), n, p) beta <- rep(0, p) beta[c(5, 10, 20)] <- c(0.5, 0.4, 0.3) y <- as.vector(X %*% beta + rnorm(n)) input_ss <- compute_suff_stat(X, y, standardize = TRUE) ss <- univariate_regression(X, y) R <- with(input_ss, cov2cor(XtX)) R <- (R + t(R)) / 2 z <- with(ss, betahat / sebetahat) args <- list(z = z, R = R, L = 10, lambda = 1e-5, intercept_value = 0.5, estimate_prior_method = "EM", estimate_residual_variance = TRUE) compare_to_reference("susie_rss_lambda", args, tolerance = 1e-5, ref_func_name = "susie_rss") }) test_that("susie_rss_lambda() matches reference with intercept_value=0.5 - simple", { skip_if_no_reference() set.seed(15) n <- 500 p <- 50 X <- matrix(rnorm(n * p), n, p) beta <- rep(0, p) beta[c(5, 10, 20)] <- c(0.5, 0.4, 0.3) y <- as.vector(X %*% beta + rnorm(n)) input_ss <- compute_suff_stat(X, y, standardize = TRUE) ss <- univariate_regression(X, y) R <- with(input_ss, cov2cor(XtX)) R <- (R + t(R)) / 2 z <- with(ss, betahat / sebetahat) args <- list(z = z, R = R, L = 10, lambda = 1e-5, intercept_value = 0.5, estimate_prior_method = "simple", estimate_residual_variance = TRUE) compare_to_reference("susie_rss_lambda", args, tolerance = 1e-5, ref_func_name = "susie_rss") }) # ============================================================================= # Part 12: Combined parameter tests # ============================================================================= test_that("susie_rss_lambda() matches reference with combined params - optim", { skip_if_no_reference() set.seed(16) n <- 500 p <- 50 X <- 
matrix(rnorm(n * p), n, p) beta <- rep(0, p) beta[c(5, 10, 20)] <- c(0.5, 0.4, 0.3) y <- as.vector(X %*% beta + rnorm(n)) input_ss <- compute_suff_stat(X, y, standardize = TRUE) ss <- univariate_regression(X, y) R <- with(input_ss, cov2cor(XtX)) R <- (R + t(R)) / 2 z <- with(ss, betahat / sebetahat) # Test combination: estimate_prior_variance=FALSE, estimate_residual_variance=FALSE args <- list( z = z, R = R, L = 10, lambda = 1e-5, estimate_prior_variance = FALSE, estimate_residual_variance = FALSE, residual_variance = 1.0, estimate_prior_method = "optim" ) compare_to_reference("susie_rss_lambda", args, tolerance = 1e-5, ref_func_name = "susie_rss") }) test_that("susie_rss_lambda() matches reference with combined params - EM", { skip_if_no_reference() set.seed(16) n <- 500 p <- 50 X <- matrix(rnorm(n * p), n, p) beta <- rep(0, p) beta[c(5, 10, 20)] <- c(0.5, 0.4, 0.3) y <- as.vector(X %*% beta + rnorm(n)) input_ss <- compute_suff_stat(X, y, standardize = TRUE) ss <- univariate_regression(X, y) R <- with(input_ss, cov2cor(XtX)) R <- (R + t(R)) / 2 z <- with(ss, betahat / sebetahat) args <- list( z = z, R = R, L = 10, lambda = 1e-5, estimate_prior_variance = FALSE, estimate_residual_variance = FALSE, residual_variance = 1.0, estimate_prior_method = "EM" ) compare_to_reference("susie_rss_lambda", args, tolerance = 1e-5, ref_func_name = "susie_rss") }) test_that("susie_rss_lambda() matches reference with combined params - simple", { skip_if_no_reference() set.seed(16) n <- 500 p <- 50 X <- matrix(rnorm(n * p), n, p) beta <- rep(0, p) beta[c(5, 10, 20)] <- c(0.5, 0.4, 0.3) y <- as.vector(X %*% beta + rnorm(n)) input_ss <- compute_suff_stat(X, y, standardize = TRUE) ss <- univariate_regression(X, y) R <- with(input_ss, cov2cor(XtX)) R <- (R + t(R)) / 2 z <- with(ss, betahat / sebetahat) args <- list( z = z, R = R, L = 10, lambda = 1e-5, estimate_prior_variance = FALSE, estimate_residual_variance = FALSE, residual_variance = 1.0, estimate_prior_method = "simple" ) 
compare_to_reference("susie_rss_lambda", args, tolerance = 1e-5,
                     ref_func_name = "susie_rss")
})

================================================
FILE: tests/testthat/reference/test_susie_rss_reference.R
================================================
# Source helper functions
source(file.path("..", "helper_reference.R"), local = TRUE)

context("susie_rss reference comparison")

# =============================================================================
# REFERENCE TESTS FOR susie_rss() with lambda = 0
# =============================================================================
#
# These tests compare the new susie_rss() implementation (lambda = 0) against
# the reference package susie_rss() from stephenslab/susieR@1f9166c
#
# Tests cover all major parameters with all three prior variance optimization
# methods: "optim", "EM", "simple"
# =============================================================================

# -----------------------------------------------------------------------------
# Part 1: Basic Input Formats
# -----------------------------------------------------------------------------
# Test that different input formats (z, bhat/shat) work correctly

test_that("susie_rss() matches reference with z-scores - optim", {
  skip_if_no_reference()
  set.seed(1)
  n <- 500
  p <- 50
  X <- matrix(rnorm(n * p), n, p)
  beta <- rep(0, p)
  beta[c(5, 10, 20)] <- c(0.5, 0.4, 0.3)
  y <- as.vector(X %*% beta + rnorm(n))
  # Compute z-scores and R using standard approach
  input_ss <- compute_suff_stat(X, y, standardize = TRUE)
  ss <- univariate_regression(X, y)
  R <- with(input_ss, cov2cor(XtX))
  R <- (R + t(R)) / 2
  z <- with(ss, betahat / sebetahat)
  args <- list(z = z, R = R, n = n, L = 10,
               estimate_prior_method = "optim")
  compare_to_reference("susie_rss", args, tolerance = 1e-5)
})

test_that("susie_rss() matches reference with z-scores - EM", {
  skip_if_no_reference()
  set.seed(1)
  n <- 500
  p <- 50
  X <- matrix(rnorm(n * p), n, p)
  beta <- rep(0, p)
  beta[c(5, 10, 20)] <- c(0.5, 0.4, 0.3)
  y <- as.vector(X %*% beta + rnorm(n))
  input_ss <- compute_suff_stat(X, y, standardize = TRUE)
  ss <- univariate_regression(X, y)
  R <- with(input_ss, cov2cor(XtX))
  R <- (R + t(R)) / 2
  z <- with(ss, betahat / sebetahat)
  args <- list(z = z, R = R, n = n, L = 10,
               estimate_prior_method = "EM")
  compare_to_reference("susie_rss", args, tolerance = 1e-5)
})

test_that("susie_rss() matches reference with z-scores - simple", {
  skip_if_no_reference()
  set.seed(1)
  n <- 500
  p <- 50
  X <- matrix(rnorm(n * p), n, p)
  beta <- rep(0, p)
  beta[c(5, 10, 20)] <- c(0.5, 0.4, 0.3)
  y <- as.vector(X %*% beta + rnorm(n))
  input_ss <- compute_suff_stat(X, y, standardize = TRUE)
  ss <- univariate_regression(X, y)
  R <- with(input_ss, cov2cor(XtX))
  R <- (R + t(R)) / 2
  z <- with(ss, betahat / sebetahat)
  args <- list(z = z, R = R, n = n, L = 10,
               estimate_prior_method = "simple")
  compare_to_reference("susie_rss", args, tolerance = 1e-5)
})

test_that("susie_rss() matches reference with bhat/shat - optim", {
  skip_if_no_reference()
  set.seed(2)
  n <- 500
  p <- 50
  X <- matrix(rnorm(n * p), n, p)
  beta <- rep(0, p)
  beta[c(5, 10, 20)] <- c(0.5, 0.4, 0.3)
  y <- as.vector(X %*% beta + rnorm(n))
  # Compute bhat, shat and R
  input_ss <- compute_suff_stat(X, y, standardize = TRUE)
  ss <- univariate_regression(X, y)
  R <- with(input_ss, cov2cor(XtX))
  R <- (R + t(R)) / 2
  bhat <- ss$betahat
  shat <- ss$sebetahat
  args <- list(bhat = bhat, shat = shat, R = R, n = n, L = 10,
               estimate_prior_method = "optim")
  compare_to_reference("susie_rss", args, tolerance = 1e-5)
})

test_that("susie_rss() matches reference with bhat/shat - EM", {
  skip_if_no_reference()
  set.seed(2)
  n <- 500
  p <- 50
  X <- matrix(rnorm(n * p), n, p)
  beta <- rep(0, p)
  beta[c(5, 10, 20)] <- c(0.5, 0.4, 0.3)
  y <- as.vector(X %*% beta + rnorm(n))
  input_ss <- compute_suff_stat(X, y, standardize = TRUE)
  ss <- univariate_regression(X, y)
  R <- with(input_ss, cov2cor(XtX))
  R <- (R + t(R)) / 2
  bhat <- ss$betahat
  shat <- ss$sebetahat
  args <- list(bhat = bhat, shat = shat, R = R, n = n, L = 10,
               estimate_prior_method = "EM")
  compare_to_reference("susie_rss", args, tolerance = 1e-5)
})

test_that("susie_rss() matches reference with bhat/shat - simple", {
  skip_if_no_reference()
  set.seed(2)
  n <- 500
  p <- 50
  X <- matrix(rnorm(n * p), n, p)
  beta <- rep(0, p)
  beta[c(5, 10, 20)] <- c(0.5, 0.4, 0.3)
  y <- as.vector(X %*% beta + rnorm(n))
  input_ss <- compute_suff_stat(X, y, standardize = TRUE)
  ss <- univariate_regression(X, y)
  R <- with(input_ss, cov2cor(XtX))
  R <- (R + t(R)) / 2
  bhat <- ss$betahat
  shat <- ss$sebetahat
  args <- list(bhat = bhat, shat = shat, R = R, n = n, L = 10,
               estimate_prior_method = "simple")
  compare_to_reference("susie_rss", args, tolerance = 1e-5)
})

# -----------------------------------------------------------------------------
# Part 2: Sample size n parameter
# -----------------------------------------------------------------------------
# Test with n provided vs. not provided (large n approximation)

test_that("susie_rss() matches reference with n provided - optim", {
  skip_if_no_reference()
  set.seed(3)
  n <- 500
  p <- 50
  X <- matrix(rnorm(n * p), n, p)
  beta <- rep(0, p)
  beta[c(5, 10, 20)] <- c(0.5, 0.4, 0.3)
  y <- as.vector(X %*% beta + rnorm(n))
  input_ss <- compute_suff_stat(X, y, standardize = TRUE)
  ss <- univariate_regression(X, y)
  R <- with(input_ss, cov2cor(XtX))
  R <- (R + t(R)) / 2
  z <- with(ss, betahat / sebetahat)
  args <- list(z = z, R = R, n = n, L = 10,
               estimate_prior_method = "optim")
  compare_to_reference("susie_rss", args, tolerance = 1e-5)
})

test_that("susie_rss() matches reference with n provided - EM", {
  skip_if_no_reference()
  set.seed(3)
  n <- 500
  p <- 50
  X <- matrix(rnorm(n * p), n, p)
  beta <- rep(0, p)
  beta[c(5, 10, 20)] <- c(0.5, 0.4, 0.3)
  y <- as.vector(X %*% beta + rnorm(n))
  input_ss <- compute_suff_stat(X, y, standardize = TRUE)
  ss <- univariate_regression(X, y)
  R <- with(input_ss, cov2cor(XtX))
  R <- (R + t(R)) / 2
  z <- with(ss, betahat / sebetahat)
  args <- list(z = z, R = R, n = n, L = 10,
               estimate_prior_method = "EM")
  compare_to_reference("susie_rss", args, tolerance = 1e-5)
})

test_that("susie_rss() matches reference with n provided - simple", {
  skip_if_no_reference()
  set.seed(3)
  n <- 500
  p <- 50
  X <- matrix(rnorm(n * p), n, p)
  beta <- rep(0, p)
  beta[c(5, 10, 20)] <- c(0.5, 0.4, 0.3)
  y <- as.vector(X %*% beta + rnorm(n))
  input_ss <- compute_suff_stat(X, y, standardize = TRUE)
  ss <- univariate_regression(X, y)
  R <- with(input_ss, cov2cor(XtX))
  R <- (R + t(R)) / 2
  z <- with(ss, betahat / sebetahat)
  args <- list(z = z, R = R, n = n, L = 10,
               estimate_prior_method = "simple")
  compare_to_reference("susie_rss", args, tolerance = 1e-5)
})

test_that("susie_rss() matches reference without n - optim", {
  skip_if_no_reference()
  set.seed(4)
  n <- 500
  p <- 50
  X <- matrix(rnorm(n * p), n, p)
  beta <- rep(0, p)
  beta[c(5, 10, 20)] <- c(0.5, 0.4, 0.3)
  y <- as.vector(X %*% beta + rnorm(n))
  input_ss <- compute_suff_stat(X, y, standardize = TRUE)
  ss <- univariate_regression(X, y)
  R <- with(input_ss, cov2cor(XtX))
  R <- (R + t(R)) / 2
  z <- with(ss, betahat / sebetahat)
  # Note: n not provided - uses large n approximation
  args <- list(z = z, R = R, L = 10,
               estimate_prior_method = "optim")
  compare_to_reference("susie_rss", args, tolerance = 1e-5)
})

test_that("susie_rss() matches reference without n - EM", {
  skip_if_no_reference()
  set.seed(4)
  n <- 500
  p <- 50
  X <- matrix(rnorm(n * p), n, p)
  beta <- rep(0, p)
  beta[c(5, 10, 20)] <- c(0.5, 0.4, 0.3)
  y <- as.vector(X %*% beta + rnorm(n))
  input_ss <- compute_suff_stat(X, y, standardize = TRUE)
  ss <- univariate_regression(X, y)
  R <- with(input_ss, cov2cor(XtX))
  R <- (R + t(R)) / 2
  z <- with(ss, betahat / sebetahat)
  args <- list(z = z, R = R, L = 10,
               estimate_prior_method = "EM")
  compare_to_reference("susie_rss", args, tolerance = 1e-5)
})

test_that("susie_rss() matches reference without n - simple", {
  skip_if_no_reference()
  set.seed(4)
  n <- 500
  p <- 50
  X <- matrix(rnorm(n * p), n, p)
  beta <- rep(0, p)
  beta[c(5, 10, 20)] <- c(0.5, 0.4, 0.3)
  y <- as.vector(X %*% beta + rnorm(n))
  input_ss <- compute_suff_stat(X, y, standardize = TRUE)
  ss <- univariate_regression(X, y)
  R <- with(input_ss, cov2cor(XtX))
  R <- (R + t(R)) / 2
  z <- with(ss, betahat / sebetahat)
  args <- list(z = z, R = R, L = 10,
               estimate_prior_method = "simple")
  compare_to_reference("susie_rss", args, tolerance = 1e-5)
})

# -----------------------------------------------------------------------------
# Part 3: Different L values
# -----------------------------------------------------------------------------

test_that("susie_rss() matches reference with different L values - optim", {
  skip_if_no_reference()
  set.seed(5)
  n <- 500
  p <- 50
  X <- matrix(rnorm(n * p), n, p)
  beta <- rep(0, p)
  beta[c(5, 10, 20)] <- c(0.5, 0.4, 0.3)
  y <- as.vector(X %*% beta + rnorm(n))
  input_ss <- compute_suff_stat(X, y, standardize = TRUE)
  ss <- univariate_regression(X, y)
  R <- with(input_ss, cov2cor(XtX))
  R <- (R + t(R)) / 2
  z <- with(ss, betahat / sebetahat)
  # Test L=1
  args1 <- list(z = z, R = R, n = n, L = 1,
                estimate_prior_method = "optim")
  compare_to_reference("susie_rss", args1, tolerance = 1e-5)
  # Test L=5
  args5 <- list(z = z, R = R, n = n, L = 5,
                estimate_prior_method = "optim")
  compare_to_reference("susie_rss", args5, tolerance = 1e-5)
  # Test L=20
  args20 <- list(z = z, R = R, n = n, L = 20,
                 estimate_prior_method = "optim")
  compare_to_reference("susie_rss", args20, tolerance = 1e-5)
})

test_that("susie_rss() matches reference with different L values - EM", {
  skip_if_no_reference()
  set.seed(5)
  n <- 500
  p <- 50
  X <- matrix(rnorm(n * p), n, p)
  beta <- rep(0, p)
  beta[c(5, 10, 20)] <- c(0.5, 0.4, 0.3)
  y <- as.vector(X %*% beta + rnorm(n))
  input_ss <- compute_suff_stat(X, y, standardize = TRUE)
  ss <- univariate_regression(X, y)
  R <- with(input_ss, cov2cor(XtX))
  R <- (R + t(R)) / 2
  z <- with(ss, betahat / sebetahat)
  # Test L=1
  args1 <- list(z = z, R = R, n = n, L = 1,
                estimate_prior_method = "EM")
  compare_to_reference("susie_rss", args1, tolerance = 1e-5)
  # Test L=5
  args5 <- list(z = z, R = R, n = n, L = 5,
                estimate_prior_method = "EM")
  compare_to_reference("susie_rss", args5, tolerance = 1e-5)
  # Test L=20
  args20 <- list(z = z, R = R, n = n, L = 20,
                 estimate_prior_method = "EM")
  compare_to_reference("susie_rss", args20, tolerance = 1e-5)
})

test_that("susie_rss() matches reference with different L values - simple", {
  skip_if_no_reference()
  set.seed(5)
  n <- 500
  p <- 50
  X <- matrix(rnorm(n * p), n, p)
  beta <- rep(0, p)
  beta[c(5, 10, 20)] <- c(0.5, 0.4, 0.3)
  y <- as.vector(X %*% beta + rnorm(n))
  input_ss <- compute_suff_stat(X, y, standardize = TRUE)
  ss <- univariate_regression(X, y)
  R <- with(input_ss, cov2cor(XtX))
  R <- (R + t(R)) / 2
  z <- with(ss, betahat / sebetahat)
  # Test L=1
  args1 <- list(z = z, R = R, n = n, L = 1,
                estimate_prior_method = "simple")
  compare_to_reference("susie_rss", args1, tolerance = 1e-5)
  # Test L=5
  args5 <- list(z = z, R = R, n = n, L = 5,
                estimate_prior_method = "simple")
  compare_to_reference("susie_rss", args5, tolerance = 1e-5)
  # Test L=20
  args20 <- list(z = z, R = R, n = n, L = 20,
                 estimate_prior_method = "simple")
  compare_to_reference("susie_rss", args20, tolerance = 1e-5)
})

# -----------------------------------------------------------------------------
# Part 4: estimate_prior_variance parameter
# -----------------------------------------------------------------------------

test_that("susie_rss() matches reference with estimate_prior_variance=FALSE - optim", {
  skip_if_no_reference()
  set.seed(6)
  n <- 500
  p <- 50
  X <- matrix(rnorm(n * p), n, p)
  beta <- rep(0, p)
  beta[c(5, 10, 20)] <- c(0.5, 0.4, 0.3)
  y <- as.vector(X %*% beta + rnorm(n))
  input_ss <- compute_suff_stat(X, y, standardize = TRUE)
  ss <- univariate_regression(X, y)
  R <- with(input_ss, cov2cor(XtX))
  R <- (R + t(R)) / 2
  z <- with(ss, betahat / sebetahat)
  args <- list(
    z = z, R = R, n = n, L = 10,
    estimate_prior_variance = FALSE,
    estimate_prior_method = "optim"
  )
  compare_to_reference("susie_rss", args, tolerance = 1e-5)
})

test_that("susie_rss() matches reference with estimate_prior_variance=FALSE - EM", {
  skip_if_no_reference()
  set.seed(6)
  n <- 500
  p <- 50
  X <- matrix(rnorm(n * p), n, p)
  beta <- rep(0, p)
  beta[c(5, 10, 20)] <- c(0.5, 0.4, 0.3)
  y <- as.vector(X %*% beta + rnorm(n))
  input_ss <- compute_suff_stat(X, y, standardize = TRUE)
  ss <- univariate_regression(X, y)
  R <- with(input_ss, cov2cor(XtX))
  R <- (R + t(R)) / 2
  z <- with(ss, betahat / sebetahat)
  args <- list(
    z = z, R = R, n = n, L = 10,
    estimate_prior_variance = FALSE,
    estimate_prior_method = "EM"
  )
  compare_to_reference("susie_rss", args, tolerance = 1e-5)
})

test_that("susie_rss() matches reference with estimate_prior_variance=FALSE - simple", {
  skip_if_no_reference()
  set.seed(6)
  n <- 500
  p <- 50
  X <- matrix(rnorm(n * p), n, p)
  beta <- rep(0, p)
  beta[c(5, 10, 20)] <- c(0.5, 0.4, 0.3)
  y <- as.vector(X %*% beta + rnorm(n))
  input_ss <- compute_suff_stat(X, y, standardize = TRUE)
  ss <- univariate_regression(X, y)
  R <- with(input_ss, cov2cor(XtX))
  R <- (R + t(R)) / 2
  z <- with(ss, betahat / sebetahat)
  args <- list(
    z = z, R = R, n = n, L = 10,
    estimate_prior_variance = FALSE,
    estimate_prior_method = "simple"
  )
  compare_to_reference("susie_rss", args, tolerance = 1e-5)
})

# -----------------------------------------------------------------------------
# Part 5: estimate_residual_variance parameter
# -----------------------------------------------------------------------------

test_that("susie_rss() matches reference with estimate_residual_variance=TRUE - optim", {
  skip_if_no_reference()
  set.seed(7)
  n <- 500
  p <- 50
  X <- matrix(rnorm(n * p), n, p)
  beta <- rep(0, p)
  beta[c(5, 10, 20)] <- c(0.5, 0.4, 0.3)
  y <- as.vector(X %*% beta + rnorm(n))
  input_ss <- compute_suff_stat(X, y, standardize = TRUE)
  ss <- univariate_regression(X, y)
  R <- with(input_ss, cov2cor(XtX))
  R <- (R + t(R)) / 2
  z <- with(ss, betahat / sebetahat)
  args <- list(
    z = z, R = R, n = n, L = 10,
    estimate_residual_variance = TRUE,
    estimate_prior_method = "optim"
  )
  compare_to_reference("susie_rss", args, tolerance = 1e-5)
})

test_that("susie_rss() matches reference with estimate_residual_variance=TRUE - EM", {
  skip_if_no_reference()
  set.seed(7)
  n <- 500
  p <- 50
  X <- matrix(rnorm(n * p), n, p)
  beta <- rep(0, p)
  beta[c(5, 10, 20)] <- c(0.5, 0.4, 0.3)
  y <- as.vector(X %*% beta + rnorm(n))
  input_ss <- compute_suff_stat(X, y, standardize = TRUE)
  ss <- univariate_regression(X, y)
  R <- with(input_ss, cov2cor(XtX))
  R <- (R + t(R)) / 2
  z <- with(ss, betahat / sebetahat)
  args <- list(
    z = z, R = R, n = n, L = 10,
    estimate_residual_variance = TRUE,
    estimate_prior_method = "EM"
  )
  compare_to_reference("susie_rss", args, tolerance = 1e-5)
})

test_that("susie_rss() matches reference with estimate_residual_variance=TRUE - simple", {
  skip_if_no_reference()
  set.seed(7)
  n <- 500
  p <- 50
  X <- matrix(rnorm(n * p), n, p)
  beta <- rep(0, p)
  beta[c(5, 10, 20)] <- c(0.5, 0.4, 0.3)
  y <- as.vector(X %*% beta + rnorm(n))
  input_ss <- compute_suff_stat(X, y, standardize = TRUE)
  ss <- univariate_regression(X, y)
  R <- with(input_ss, cov2cor(XtX))
  R <- (R + t(R)) / 2
  z <- with(ss, betahat / sebetahat)
  args <- list(
    z = z, R = R, n = n, L = 10,
    estimate_residual_variance = TRUE,
    estimate_prior_method = "simple"
  )
  compare_to_reference("susie_rss", args, tolerance = 1e-5)
})

test_that("susie_rss() matches reference with estimate_residual_variance=FALSE - optim", {
  skip_if_no_reference()
  set.seed(8)
  n <- 500
  p <- 50
  X <- matrix(rnorm(n * p), n, p)
  beta <- rep(0, p)
  beta[c(5, 10, 20)] <- c(0.5, 0.4, 0.3)
  y <- as.vector(X %*% beta + rnorm(n))
  input_ss <- compute_suff_stat(X, y, standardize = TRUE)
  ss <- univariate_regression(X, y)
  R <- with(input_ss, cov2cor(XtX))
  R <- (R + t(R)) / 2
  z <- with(ss, betahat / sebetahat)
  args <- list(
    z = z, R = R, n = n, L = 10,
    estimate_residual_variance = FALSE,
    residual_variance = 1.0,
    estimate_prior_method = "optim"
  )
  compare_to_reference("susie_rss", args, tolerance = 1e-5)
})

test_that("susie_rss() matches reference with estimate_residual_variance=FALSE - EM", {
  skip_if_no_reference()
  set.seed(8)
  n <- 500
  p <- 50
  X <- matrix(rnorm(n * p), n, p)
  beta <- rep(0, p)
  beta[c(5, 10, 20)] <- c(0.5, 0.4, 0.3)
  y <- as.vector(X %*% beta + rnorm(n))
  input_ss <- compute_suff_stat(X, y, standardize = TRUE)
  ss <- univariate_regression(X, y)
  R <- with(input_ss, cov2cor(XtX))
  R <- (R + t(R)) / 2
  z <- with(ss, betahat / sebetahat)
  args <- list(
    z = z, R = R, n = n, L = 10,
    estimate_residual_variance = FALSE,
    residual_variance = 1.0,
    estimate_prior_method = "EM"
  )
  compare_to_reference("susie_rss", args, tolerance = 1e-5)
})

test_that("susie_rss() matches reference with estimate_residual_variance=FALSE - simple", {
  skip_if_no_reference()
  set.seed(8)
  n <- 500
  p <- 50
  X <- matrix(rnorm(n * p), n, p)
  beta <- rep(0, p)
  beta[c(5, 10, 20)] <- c(0.5, 0.4, 0.3)
  y <- as.vector(X %*% beta + rnorm(n))
  input_ss <- compute_suff_stat(X, y, standardize = TRUE)
  ss <- univariate_regression(X, y)
  R <- with(input_ss, cov2cor(XtX))
  R <- (R + t(R)) / 2
  z <- with(ss, betahat / sebetahat)
  args <- list(
    z = z, R = R, n = n, L = 10,
    estimate_residual_variance = FALSE,
    residual_variance = 1.0,
    estimate_prior_method = "simple"
  )
  compare_to_reference("susie_rss", args, tolerance = 1e-5)
})

# -----------------------------------------------------------------------------
# Part 6: prior_weights
# -----------------------------------------------------------------------------

test_that("susie_rss() matches reference with prior_weights - optim", {
  skip_if_no_reference()
  set.seed(9)
  n <- 500
  p <- 50
  X <- matrix(rnorm(n * p), n, p)
  beta <- rep(0, p)
  beta[c(5, 10, 20)] <- c(0.5, 0.4, 0.3)
  y <- as.vector(X %*% beta + rnorm(n))
  input_ss <- compute_suff_stat(X, y, standardize = TRUE)
  ss <- univariate_regression(X, y)
  R <- with(input_ss, cov2cor(XtX))
  R <- (R + t(R)) / 2
  z <- with(ss, betahat / sebetahat)
  # Use non-uniform prior weights
  prior_weights <- runif(p)
  prior_weights <- prior_weights / sum(prior_weights)
  args <- list(z = z, R = R, n = n, L = 10,
               prior_weights = prior_weights,
               estimate_prior_method = "optim")
  compare_to_reference("susie_rss", args, tolerance = 1e-5)
})

test_that("susie_rss() matches reference with prior_weights - EM", {
  skip_if_no_reference()
  set.seed(9)
  n <- 500
  p <- 50
  X <- matrix(rnorm(n * p), n, p)
  beta <- rep(0, p)
  beta[c(5, 10, 20)] <- c(0.5, 0.4, 0.3)
  y <- as.vector(X %*% beta + rnorm(n))
  input_ss <- compute_suff_stat(X, y, standardize = TRUE)
  ss <- univariate_regression(X, y)
  R <- with(input_ss, cov2cor(XtX))
  R <- (R + t(R)) / 2
  z <- with(ss, betahat / sebetahat)
  # Use non-uniform prior weights
  prior_weights <- runif(p)
  prior_weights <- prior_weights / sum(prior_weights)
  args <- list(z = z, R = R, n = n, L = 10,
               prior_weights = prior_weights,
               estimate_prior_method = "EM")
  compare_to_reference("susie_rss", args, tolerance = 1e-5)
})

test_that("susie_rss() matches reference with prior_weights - simple", {
  skip_if_no_reference()
  set.seed(9)
  n <- 500
  p <- 50
  X <- matrix(rnorm(n * p), n, p)
  beta <- rep(0, p)
  beta[c(5, 10, 20)] <- c(0.5, 0.4, 0.3)
  y <- as.vector(X %*% beta + rnorm(n))
  input_ss <- compute_suff_stat(X, y, standardize = TRUE)
  ss <- univariate_regression(X, y)
  R <- with(input_ss, cov2cor(XtX))
  R <- (R + t(R)) / 2
  z <- with(ss, betahat / sebetahat)
  # Use non-uniform prior weights
  prior_weights <- runif(p)
  prior_weights <- prior_weights / sum(prior_weights)
  args <- list(z = z, R = R, n = n, L = 10,
               prior_weights = prior_weights,
               estimate_prior_method = "simple")
  compare_to_reference("susie_rss", args, tolerance = 1e-5)
})

# -----------------------------------------------------------------------------
# Part 7: scaled_prior_variance
# -----------------------------------------------------------------------------

test_that("susie_rss() matches reference with scaled_prior_variance - optim", {
  skip_if_no_reference()
  set.seed(10)
  n <- 500
  p <- 50
  X <- matrix(rnorm(n * p), n, p)
  beta <- rep(0, p)
  beta[c(5, 10, 20)] <- c(0.5, 0.4, 0.3)
  y <- as.vector(X %*% beta + rnorm(n))
  input_ss <- compute_suff_stat(X, y, standardize = TRUE)
  ss <- univariate_regression(X, y)
  R <- with(input_ss, cov2cor(XtX))
  R <- (R + t(R)) / 2
  z <- with(ss, betahat / sebetahat)
  args <- list(z = z, R = R, n = n, L = 10,
               scaled_prior_variance = 0.5,
               estimate_prior_method = "optim")
  compare_to_reference("susie_rss", args, tolerance = 1e-5)
})

test_that("susie_rss() matches reference with scaled_prior_variance - EM", {
  skip_if_no_reference()
  set.seed(10)
  n <- 500
  p <- 50
  X <- matrix(rnorm(n * p), n, p)
  beta <- rep(0, p)
  beta[c(5, 10, 20)] <- c(0.5, 0.4, 0.3)
  y <- as.vector(X %*% beta + rnorm(n))
  input_ss <- compute_suff_stat(X, y, standardize = TRUE)
  ss <- univariate_regression(X, y)
  R <- with(input_ss, cov2cor(XtX))
  R <- (R + t(R)) / 2
  z <- with(ss, betahat / sebetahat)
  args <- list(z = z, R = R, n = n, L = 10,
               scaled_prior_variance = 0.5,
               estimate_prior_method = "EM")
  compare_to_reference("susie_rss", args, tolerance = 1e-5)
})

test_that("susie_rss() matches reference with scaled_prior_variance - simple", {
  skip_if_no_reference()
  set.seed(10)
  n <- 500
  p <- 50
  X <- matrix(rnorm(n * p), n, p)
  beta <- rep(0, p)
  beta[c(5, 10, 20)] <- c(0.5, 0.4, 0.3)
  y <- as.vector(X %*% beta + rnorm(n))
  input_ss <- compute_suff_stat(X, y, standardize = TRUE)
  ss <- univariate_regression(X, y)
  R <- with(input_ss, cov2cor(XtX))
  R <- (R + t(R)) / 2
  z <- with(ss, betahat / sebetahat)
  args <- list(z = z, R = R, n = n, L = 10,
               scaled_prior_variance = 0.5,
               estimate_prior_method = "simple")
  compare_to_reference("susie_rss", args, tolerance = 1e-5)
})

# -----------------------------------------------------------------------------
# Part 8: var_y parameter
# -----------------------------------------------------------------------------

test_that("susie_rss() matches reference with var_y - optim", {
  skip_if_no_reference()
  set.seed(11)
  n <- 500
  p <- 50
  X <- matrix(rnorm(n * p), n, p)
  beta <- rep(0, p)
  beta[c(5, 10, 20)] <- c(0.5, 0.4, 0.3)
  y <- as.vector(X %*% beta + rnorm(n))
  # Compute bhat, shat and R
input_ss <- compute_suff_stat(X, y, standardize = TRUE) ss <- univariate_regression(X, y) R <- with(input_ss, cov2cor(XtX)) R <- (R + t(R)) / 2 bhat <- ss$betahat shat <- ss$sebetahat var_y <- var(y) args <- list(bhat = bhat, shat = shat, R = R, n = n, L = 10, var_y = var_y, estimate_prior_method = "optim") compare_to_reference("susie_rss", args, tolerance = 1e-5) }) test_that("susie_rss() matches reference with var_y - EM", { skip_if_no_reference() set.seed(11) n <- 500 p <- 50 X <- matrix(rnorm(n * p), n, p) beta <- rep(0, p) beta[c(5, 10, 20)] <- c(0.5, 0.4, 0.3) y <- as.vector(X %*% beta + rnorm(n)) input_ss <- compute_suff_stat(X, y, standardize = TRUE) ss <- univariate_regression(X, y) R <- with(input_ss, cov2cor(XtX)) R <- (R + t(R)) / 2 bhat <- ss$betahat shat <- ss$sebetahat var_y <- var(y) args <- list(bhat = bhat, shat = shat, R = R, n = n, L = 10, var_y = var_y, estimate_prior_method = "EM") compare_to_reference("susie_rss", args, tolerance = 1e-5) }) test_that("susie_rss() matches reference with var_y - simple", { skip_if_no_reference() set.seed(11) n <- 500 p <- 50 X <- matrix(rnorm(n * p), n, p) beta <- rep(0, p) beta[c(5, 10, 20)] <- c(0.5, 0.4, 0.3) y <- as.vector(X %*% beta + rnorm(n)) input_ss <- compute_suff_stat(X, y, standardize = TRUE) ss <- univariate_regression(X, y) R <- with(input_ss, cov2cor(XtX)) R <- (R + t(R)) / 2 bhat <- ss$betahat shat <- ss$sebetahat var_y <- var(y) args <- list(bhat = bhat, shat = shat, R = R, n = n, L = 10, var_y = var_y, estimate_prior_method = "simple") compare_to_reference("susie_rss", args, tolerance = 1e-5) }) # ============================================================================= # Part 9: coverage and min_abs_corr # ============================================================================= test_that("susie_rss() matches reference with coverage=0.99 - optim", { skip_if_no_reference() set.seed(12) n <- 500 p <- 50 X <- matrix(rnorm(n * p), n, p) beta <- rep(0, p) beta[c(5, 10, 20)] <- c(0.5, 0.4, 
0.3) y <- as.vector(X %*% beta + rnorm(n)) input_ss <- compute_suff_stat(X, y, standardize = TRUE) ss <- univariate_regression(X, y) R <- with(input_ss, cov2cor(XtX)) R <- (R + t(R)) / 2 z <- with(ss, betahat / sebetahat) args <- list(z = z, R = R, n = n, L = 10, coverage = 0.99, estimate_prior_method = "optim") compare_to_reference("susie_rss", args, tolerance = 1e-5) }) test_that("susie_rss() matches reference with coverage=0.99 - EM", { skip_if_no_reference() set.seed(12) n <- 500 p <- 50 X <- matrix(rnorm(n * p), n, p) beta <- rep(0, p) beta[c(5, 10, 20)] <- c(0.5, 0.4, 0.3) y <- as.vector(X %*% beta + rnorm(n)) input_ss <- compute_suff_stat(X, y, standardize = TRUE) ss <- univariate_regression(X, y) R <- with(input_ss, cov2cor(XtX)) R <- (R + t(R)) / 2 z <- with(ss, betahat / sebetahat) args <- list(z = z, R = R, n = n, L = 10, coverage = 0.99, estimate_prior_method = "EM") compare_to_reference("susie_rss", args, tolerance = 1e-5) }) test_that("susie_rss() matches reference with coverage=0.99 - simple", { skip_if_no_reference() set.seed(12) n <- 500 p <- 50 X <- matrix(rnorm(n * p), n, p) beta <- rep(0, p) beta[c(5, 10, 20)] <- c(0.5, 0.4, 0.3) y <- as.vector(X %*% beta + rnorm(n)) input_ss <- compute_suff_stat(X, y, standardize = TRUE) ss <- univariate_regression(X, y) R <- with(input_ss, cov2cor(XtX)) R <- (R + t(R)) / 2 z <- with(ss, betahat / sebetahat) args <- list(z = z, R = R, n = n, L = 10, coverage = 0.99, estimate_prior_method = "simple") compare_to_reference("susie_rss", args, tolerance = 1e-5) }) test_that("susie_rss() matches reference with min_abs_corr=0.7 - optim", { skip_if_no_reference() set.seed(13) n <- 500 p <- 50 X <- matrix(rnorm(n * p), n, p) beta <- rep(0, p) beta[c(5, 10, 20)] <- c(0.5, 0.4, 0.3) y <- as.vector(X %*% beta + rnorm(n)) input_ss <- compute_suff_stat(X, y, standardize = TRUE) ss <- univariate_regression(X, y) R <- with(input_ss, cov2cor(XtX)) R <- (R + t(R)) / 2 z <- with(ss, betahat / sebetahat) args <- list(z = z, R = R, 
n = n, L = 10, min_abs_corr = 0.7, estimate_prior_method = "optim") compare_to_reference("susie_rss", args, tolerance = 1e-5) }) test_that("susie_rss() matches reference with min_abs_corr=0.7 - EM", { skip_if_no_reference() set.seed(13) n <- 500 p <- 50 X <- matrix(rnorm(n * p), n, p) beta <- rep(0, p) beta[c(5, 10, 20)] <- c(0.5, 0.4, 0.3) y <- as.vector(X %*% beta + rnorm(n)) input_ss <- compute_suff_stat(X, y, standardize = TRUE) ss <- univariate_regression(X, y) R <- with(input_ss, cov2cor(XtX)) R <- (R + t(R)) / 2 z <- with(ss, betahat / sebetahat) args <- list(z = z, R = R, n = n, L = 10, min_abs_corr = 0.7, estimate_prior_method = "EM") compare_to_reference("susie_rss", args, tolerance = 1e-5) }) test_that("susie_rss() matches reference with min_abs_corr=0.7 - simple", { skip_if_no_reference() set.seed(13) n <- 500 p <- 50 X <- matrix(rnorm(n * p), n, p) beta <- rep(0, p) beta[c(5, 10, 20)] <- c(0.5, 0.4, 0.3) y <- as.vector(X %*% beta + rnorm(n)) input_ss <- compute_suff_stat(X, y, standardize = TRUE) ss <- univariate_regression(X, y) R <- with(input_ss, cov2cor(XtX)) R <- (R + t(R)) / 2 z <- with(ss, betahat / sebetahat) args <- list(z = z, R = R, n = n, L = 10, min_abs_corr = 0.7, estimate_prior_method = "simple") compare_to_reference("susie_rss", args, tolerance = 1e-5) }) # ============================================================================= # Part 10: prior_tol parameter # ============================================================================= test_that("susie_rss() matches reference with prior_tol=1e-5 - optim", { skip("Intentional change: susieR2.0 adds a post-convergence trim_null_effects() pass that zeros model$V entries where V < prior_tol. The reference uses prior_tol only to filter PIPs; it never zeros V. 
The args here use prior_tol=0.1 (despite the test name), which triggers the trim on dev and produces a V / alpha / mu divergence above 1e-5.") skip_if_no_reference() set.seed(15) n <- 500 p <- 50 X <- matrix(rnorm(n * p), n, p) beta <- rep(0, p) beta[c(5, 10, 20)] <- c(0.5, 0.4, 0.3) y <- as.vector(X %*% beta + rnorm(n)) input_ss <- compute_suff_stat(X, y, standardize = TRUE) ss <- univariate_regression(X, y) R <- with(input_ss, cov2cor(XtX)) R <- (R + t(R)) / 2 z <- with(ss, betahat / sebetahat) # Disable check_null_threshold so we can see prior_tol effects args <- list( z = z, R = R, n = n, L = 10, prior_tol = 0.1, estimate_prior_method = "optim" ) compare_to_reference("susie_rss", args, tolerance = 1e-5) }) test_that("susie_rss() matches reference with prior_tol=1e-5 - EM", { skip("Intentional change: susieR2.0 adds a post-convergence trim_null_effects() pass that zeros model$V entries where V < prior_tol. The reference uses prior_tol only to filter PIPs; it never zeros V. Triggers a V / alpha / mu divergence above 1e-5.") skip_if_no_reference() set.seed(15) n <- 500 p <- 50 X <- matrix(rnorm(n * p), n, p) beta <- rep(0, p) beta[c(5, 10, 20)] <- c(0.5, 0.4, 0.3) y <- as.vector(X %*% beta + rnorm(n)) input_ss <- compute_suff_stat(X, y, standardize = TRUE) ss <- univariate_regression(X, y) R <- with(input_ss, cov2cor(XtX)) R <- (R + t(R)) / 2 z <- with(ss, betahat / sebetahat) args <- list( z = z, R = R, n = n, L = 10, prior_tol = 0.1, estimate_prior_method = "EM" ) compare_to_reference("susie_rss", args, tolerance = 1e-5) }) test_that("susie_rss() matches reference with prior_tol=1e-5 - simple", { skip_if_no_reference() set.seed(15) n <- 500 p <- 50 X <- matrix(rnorm(n * p), n, p) beta <- rep(0, p) beta[c(5, 10, 20)] <- c(0.5, 0.4, 0.3) y <- as.vector(X %*% beta + rnorm(n)) input_ss <- compute_suff_stat(X, y, standardize = TRUE) ss <- univariate_regression(X, y) R <- with(input_ss, cov2cor(XtX)) R <- (R + t(R)) / 2 z <- with(ss, betahat / sebetahat) args <- list( 
z = z, R = R, n = n, L = 10, prior_tol = 0.1, estimate_prior_method = "simple" ) compare_to_reference("susie_rss", args, tolerance = 1e-5) }) # ============================================================================= # Part 11: check_null_threshold parameter # ============================================================================= test_that("susie_rss() matches reference with check_null_threshold=0.1 - optim", { skip_if_no_reference() set.seed(16) n <- 500 p <- 50 X <- matrix(rnorm(n * p), n, p) beta <- rep(0, p) beta[c(5, 10, 20)] <- c(0.5, 0.4, 0.3) y <- as.vector(X %*% beta + rnorm(n)) input_ss <- compute_suff_stat(X, y, standardize = TRUE) ss <- univariate_regression(X, y) R <- with(input_ss, cov2cor(XtX)) R <- (R + t(R)) / 2 z <- with(ss, betahat / sebetahat) args <- list( z = z, R = R, n = n, L = 10, check_null_threshold = 0.1, estimate_prior_method = "optim" ) compare_to_reference("susie_rss", args, tolerance = 1e-5) }) test_that("susie_rss() matches reference with check_null_threshold=0.1 - EM", { skip("Not a bug: susieR2.0 intentionally skips the check_null_threshold V-zeroing step for EM (see R/single_effect_regression.R:169 and stephenslab/mvsusieR#26). The check would zero V without recomputing the posterior, creating an inconsistent (q, V) pair that can decrease the ELBO. 
Since dev ignores check_null_threshold for EM, this test cannot match a reference that always applies the check.") skip_if_no_reference() set.seed(16) n <- 500 p <- 50 X <- matrix(rnorm(n * p), n, p) beta <- rep(0, p) beta[c(5, 10, 20)] <- c(0.5, 0.4, 0.3) y <- as.vector(X %*% beta + rnorm(n)) input_ss <- compute_suff_stat(X, y, standardize = TRUE) ss <- univariate_regression(X, y) R <- with(input_ss, cov2cor(XtX)) R <- (R + t(R)) / 2 z <- with(ss, betahat / sebetahat) args <- list( z = z, R = R, n = n, L = 10, check_null_threshold = 0.1, estimate_prior_method = "EM" ) compare_to_reference("susie_rss", args, tolerance = 1e-5) }) test_that("susie_rss() matches reference with check_null_threshold=0.1 - simple", { skip_if_no_reference() set.seed(16) n <- 500 p <- 50 X <- matrix(rnorm(n * p), n, p) beta <- rep(0, p) beta[c(5, 10, 20)] <- c(0.5, 0.4, 0.3) y <- as.vector(X %*% beta + rnorm(n)) input_ss <- compute_suff_stat(X, y, standardize = TRUE) ss <- univariate_regression(X, y) R <- with(input_ss, cov2cor(XtX)) R <- (R + t(R)) / 2 z <- with(ss, betahat / sebetahat) args <- list( z = z, R = R, n = n, L = 10, check_null_threshold = 0.1, estimate_prior_method = "simple" ) compare_to_reference("susie_rss", args, tolerance = 1e-5) }) # ============================================================================= # Part 11: MAF filtering # ============================================================================= test_that("susie_rss() matches reference with maf filtering - optim", { skip_if_no_reference() set.seed(17) n <- 500 p <- 50 X <- matrix(rnorm(n * p), n, p) beta <- rep(0, p) beta[c(5, 10, 20)] <- c(0.5, 0.4, 0.3) y <- as.vector(X %*% beta + rnorm(n)) input_ss <- compute_suff_stat(X, y, standardize = TRUE) ss <- univariate_regression(X, y) R <- with(input_ss, cov2cor(XtX)) R <- (R + t(R)) / 2 z <- with(ss, betahat / sebetahat) # Simulate minor allele frequencies maf <- runif(p, 0.05, 0.5) args <- list( z = z, R = R, n = n, L = 10, maf = maf, maf_thresh = 0.1, 
estimate_prior_method = "optim" ) compare_to_reference("susie_rss", args, tolerance = 1e-5) }) test_that("susie_rss() matches reference with maf filtering - EM", { skip_if_no_reference() set.seed(17) n <- 500 p <- 50 X <- matrix(rnorm(n * p), n, p) beta <- rep(0, p) beta[c(5, 10, 20)] <- c(0.5, 0.4, 0.3) y <- as.vector(X %*% beta + rnorm(n)) input_ss <- compute_suff_stat(X, y, standardize = TRUE) ss <- univariate_regression(X, y) R <- with(input_ss, cov2cor(XtX)) R <- (R + t(R)) / 2 z <- with(ss, betahat / sebetahat) # Simulate minor allele frequencies maf <- runif(p, 0.05, 0.5) args <- list( z = z, R = R, n = n, L = 10, maf = maf, maf_thresh = 0.1, estimate_prior_method = "EM" ) compare_to_reference("susie_rss", args, tolerance = 1e-5) }) test_that("susie_rss() matches reference with maf filtering - simple", { skip_if_no_reference() set.seed(17) n <- 500 p <- 50 X <- matrix(rnorm(n * p), n, p) beta <- rep(0, p) beta[c(5, 10, 20)] <- c(0.5, 0.4, 0.3) y <- as.vector(X %*% beta + rnorm(n)) input_ss <- compute_suff_stat(X, y, standardize = TRUE) ss <- univariate_regression(X, y) R <- with(input_ss, cov2cor(XtX)) R <- (R + t(R)) / 2 z <- with(ss, betahat / sebetahat) # Simulate minor allele frequencies maf <- runif(p, 0.05, 0.5) args <- list( z = z, R = R, n = n, L = 10, maf = maf, maf_thresh = 0.1, estimate_prior_method = "simple" ) compare_to_reference("susie_rss", args, tolerance = 1e-5) }) ================================================ FILE: tests/testthat/reference/test_susie_ss_reference.R ================================================ # Source helper functions source(file.path("..", "helper_reference.R"), local = TRUE) context("susie_ss reference comparison") # ============================================================================= # REFERENCE TESTS FOR susie_ss() # ============================================================================= # # These tests compare the new susie_ss() implementation against the reference # susie_suff_stat() from 
stephenslab/susieR@1f9166c # # Tests cover all major parameters and their combinations with all three # prior variance optimization methods: "optim", "EM", "simple" # ============================================================================= # Part 1: Basic Parameter Tests # ============================================================================= test_that("susie_ss() matches reference with default parameters - optim", { skip_if_no_reference() set.seed(1) n <- 100 p <- 50 X <- matrix(rnorm(n * p), n, p) beta <- rep(0, p) beta[1:4] <- c(2, 3, -2, 1.5) y <- as.vector(X %*% beta + rnorm(n)) X_centered <- scale(X, center = TRUE, scale = FALSE) y_centered <- y - mean(y) XtX <- crossprod(X_centered) Xty <- crossprod(X_centered, y_centered) yty <- sum(y_centered^2) args <- list( XtX = XtX, Xty = Xty, yty = yty, n = n, L = 10, estimate_prior_method = "optim" ) compare_to_reference("susie_ss", args, tolerance = 1e-5, ref_func_name = "susie_suff_stat") }) test_that("susie_ss() matches reference with default parameters - EM", { skip_if_no_reference() set.seed(1) n <- 100 p <- 50 X <- matrix(rnorm(n * p), n, p) beta <- rep(0, p) beta[1:4] <- c(2, 3, -2, 1.5) y <- as.vector(X %*% beta + rnorm(n)) X_centered <- scale(X, center = TRUE, scale = FALSE) y_centered <- y - mean(y) XtX <- crossprod(X_centered) Xty <- crossprod(X_centered, y_centered) yty <- sum(y_centered^2) args <- list( XtX = XtX, Xty = Xty, yty = yty, n = n, L = 10, estimate_prior_method = "EM" ) compare_to_reference("susie_ss", args, tolerance = 1e-5, ref_func_name = "susie_suff_stat") }) test_that("susie_ss() matches reference with default parameters - simple", { skip_if_no_reference() set.seed(1) n <- 100 p <- 50 X <- matrix(rnorm(n * p), n, p) beta <- rep(0, p) beta[1:4] <- c(2, 3, -2, 1.5) y <- as.vector(X %*% beta + rnorm(n)) X_centered <- scale(X, center = TRUE, scale = FALSE) y_centered <- y - mean(y) XtX <- crossprod(X_centered) Xty <- crossprod(X_centered, y_centered) yty <- sum(y_centered^2) args 
<- list( XtX = XtX, Xty = Xty, yty = yty, n = n, L = 10, estimate_prior_method = "simple" ) compare_to_reference("susie_ss", args, tolerance = 1e-5, ref_func_name = "susie_suff_stat") }) # ============================================================================= # Part 2: X_colmeans and y_mean (intercept estimation) # ============================================================================= test_that("susie_ss() matches reference with X_colmeans and y_mean - optim", { skip_if_no_reference() set.seed(2) n <- 100 p <- 50 X <- matrix(rnorm(n * p), n, p) beta <- rep(0, p) beta[1:4] <- c(2, 3, -2, 1.5) y <- as.vector(X %*% beta + rnorm(n)) X_colmeans <- colMeans(X) y_mean <- mean(y) X_centered <- scale(X, center = TRUE, scale = FALSE) y_centered <- y - y_mean XtX <- crossprod(X_centered) Xty <- crossprod(X_centered, y_centered) yty <- sum(y_centered^2) args <- list( XtX = XtX, Xty = Xty, yty = yty, n = n, L = 10, X_colmeans = X_colmeans, y_mean = y_mean, estimate_prior_method = "optim" ) compare_to_reference("susie_ss", args, tolerance = 1e-5, ref_func_name = "susie_suff_stat") }) test_that("susie_ss() matches reference with X_colmeans and y_mean - EM", { skip_if_no_reference() set.seed(2) n <- 100 p <- 50 X <- matrix(rnorm(n * p), n, p) beta <- rep(0, p) beta[1:4] <- c(2, 3, -2, 1.5) y <- as.vector(X %*% beta + rnorm(n)) X_colmeans <- colMeans(X) y_mean <- mean(y) X_centered <- scale(X, center = TRUE, scale = FALSE) y_centered <- y - y_mean XtX <- crossprod(X_centered) Xty <- crossprod(X_centered, y_centered) yty <- sum(y_centered^2) args <- list( XtX = XtX, Xty = Xty, yty = yty, n = n, L = 10, X_colmeans = X_colmeans, y_mean = y_mean, estimate_prior_method = "EM" ) compare_to_reference("susie_ss", args, tolerance = 1e-5, ref_func_name = "susie_suff_stat") }) test_that("susie_ss() matches reference with X_colmeans and y_mean - simple", { skip_if_no_reference() set.seed(2) n <- 100 p <- 50 X <- matrix(rnorm(n * p), n, p) beta <- rep(0, p) beta[1:4] <- c(2, 3, 
-2, 1.5) y <- as.vector(X %*% beta + rnorm(n)) X_colmeans <- colMeans(X) y_mean <- mean(y) X_centered <- scale(X, center = TRUE, scale = FALSE) y_centered <- y - y_mean XtX <- crossprod(X_centered) Xty <- crossprod(X_centered, y_centered) yty <- sum(y_centered^2) args <- list( XtX = XtX, Xty = Xty, yty = yty, n = n, L = 10, X_colmeans = X_colmeans, y_mean = y_mean, estimate_prior_method = "simple" ) compare_to_reference("susie_ss", args, tolerance = 1e-5, ref_func_name = "susie_suff_stat") }) # ============================================================================= # Part 3: standardize parameter # ============================================================================= test_that("susie_ss() matches reference with standardize=FALSE - optim", { skip_if_no_reference() set.seed(3) n <- 100 p <- 50 X <- matrix(rnorm(n * p), n, p) beta <- rep(0, p) beta[1:4] <- c(2, 3, -2, 1.5) y <- as.vector(X %*% beta + rnorm(n)) X_centered <- scale(X, center = TRUE, scale = FALSE) y_centered <- y - mean(y) XtX <- crossprod(X_centered) Xty <- crossprod(X_centered, y_centered) yty <- sum(y_centered^2) args <- list( XtX = XtX, Xty = Xty, yty = yty, n = n, L = 10, standardize = FALSE, estimate_prior_method = "optim" ) compare_to_reference("susie_ss", args, tolerance = 1e-5, ref_func_name = "susie_suff_stat") }) test_that("susie_ss() matches reference with standardize=FALSE - EM", { skip_if_no_reference() set.seed(3) n <- 100 p <- 50 X <- matrix(rnorm(n * p), n, p) beta <- rep(0, p) beta[1:4] <- c(2, 3, -2, 1.5) y <- as.vector(X %*% beta + rnorm(n)) X_centered <- scale(X, center = TRUE, scale = FALSE) y_centered <- y - mean(y) XtX <- crossprod(X_centered) Xty <- crossprod(X_centered, y_centered) yty <- sum(y_centered^2) args <- list( XtX = XtX, Xty = Xty, yty = yty, n = n, L = 10, standardize = FALSE, estimate_prior_method = "EM" ) compare_to_reference("susie_ss", args, tolerance = 1e-5, ref_func_name = "susie_suff_stat") }) test_that("susie_ss() matches reference with 
standardize=FALSE - simple", { skip_if_no_reference() set.seed(3) n <- 100 p <- 50 X <- matrix(rnorm(n * p), n, p) beta <- rep(0, p) beta[1:4] <- c(2, 3, -2, 1.5) y <- as.vector(X %*% beta + rnorm(n)) X_centered <- scale(X, center = TRUE, scale = FALSE) y_centered <- y - mean(y) XtX <- crossprod(X_centered) Xty <- crossprod(X_centered, y_centered) yty <- sum(y_centered^2) args <- list( XtX = XtX, Xty = Xty, yty = yty, n = n, L = 10, standardize = FALSE, estimate_prior_method = "simple" ) compare_to_reference("susie_ss", args, tolerance = 1e-5, ref_func_name = "susie_suff_stat") }) # ============================================================================= # Part 4: estimate_prior_variance=FALSE # ============================================================================= test_that("susie_ss() matches reference with estimate_prior_variance=FALSE - optim", { skip_if_no_reference() set.seed(4) n <- 100 p <- 50 X <- matrix(rnorm(n * p), n, p) beta <- rep(0, p) beta[1:4] <- c(2, 3, -2, 1.5) y <- as.vector(X %*% beta + rnorm(n)) X_centered <- scale(X, center = TRUE, scale = FALSE) y_centered <- y - mean(y) XtX <- crossprod(X_centered) Xty <- crossprod(X_centered, y_centered) yty <- sum(y_centered^2) args <- list( XtX = XtX, Xty = Xty, yty = yty, n = n, L = 10, estimate_prior_variance = FALSE, estimate_prior_method = "optim" ) compare_to_reference("susie_ss", args, tolerance = 1e-5, ref_func_name = "susie_suff_stat") }) test_that("susie_ss() matches reference with estimate_prior_variance=FALSE - EM", { skip_if_no_reference() set.seed(4) n <- 100 p <- 50 X <- matrix(rnorm(n * p), n, p) beta <- rep(0, p) beta[1:4] <- c(2, 3, -2, 1.5) y <- as.vector(X %*% beta + rnorm(n)) X_centered <- scale(X, center = TRUE, scale = FALSE) y_centered <- y - mean(y) XtX <- crossprod(X_centered) Xty <- crossprod(X_centered, y_centered) yty <- sum(y_centered^2) args <- list( XtX = XtX, Xty = Xty, yty = yty, n = n, L = 10, estimate_prior_variance = FALSE, estimate_prior_method = "EM" ) 
compare_to_reference("susie_ss", args, tolerance = 1e-5, ref_func_name = "susie_suff_stat") }) test_that("susie_ss() matches reference with estimate_prior_variance=FALSE - simple", { skip_if_no_reference() set.seed(4) n <- 100 p <- 50 X <- matrix(rnorm(n * p), n, p) beta <- rep(0, p) beta[1:4] <- c(2, 3, -2, 1.5) y <- as.vector(X %*% beta + rnorm(n)) X_centered <- scale(X, center = TRUE, scale = FALSE) y_centered <- y - mean(y) XtX <- crossprod(X_centered) Xty <- crossprod(X_centered, y_centered) yty <- sum(y_centered^2) args <- list( XtX = XtX, Xty = Xty, yty = yty, n = n, L = 10, estimate_prior_variance = FALSE, estimate_prior_method = "simple" ) compare_to_reference("susie_ss", args, tolerance = 1e-5, ref_func_name = "susie_suff_stat") }) # ============================================================================= # Part 5: estimate_residual_variance parameter # ============================================================================= test_that("susie_ss() matches reference with estimate_residual_variance=FALSE - optim", { skip_if_no_reference() set.seed(5) n <- 100 p <- 50 X <- matrix(rnorm(n * p), n, p) beta <- rep(0, p) beta[1:4] <- c(2, 3, -2, 1.5) y <- as.vector(X %*% beta + rnorm(n)) X_centered <- scale(X, center = TRUE, scale = FALSE) y_centered <- y - mean(y) XtX <- crossprod(X_centered) Xty <- crossprod(X_centered, y_centered) yty <- sum(y_centered^2) args <- list( XtX = XtX, Xty = Xty, yty = yty, n = n, L = 10, estimate_residual_variance = FALSE, residual_variance = 1.0, estimate_prior_method = "optim" ) compare_to_reference("susie_ss", args, tolerance = 1e-5, ref_func_name = "susie_suff_stat") }) test_that("susie_ss() matches reference with estimate_residual_variance=FALSE - EM", { skip_if_no_reference() set.seed(5) n <- 100 p <- 50 X <- matrix(rnorm(n * p), n, p) beta <- rep(0, p) beta[1:4] <- c(2, 3, -2, 1.5) y <- as.vector(X %*% beta + rnorm(n)) X_centered <- scale(X, center = TRUE, scale = FALSE) y_centered <- y - mean(y) XtX <- 
crossprod(X_centered) Xty <- crossprod(X_centered, y_centered) yty <- sum(y_centered^2) args <- list( XtX = XtX, Xty = Xty, yty = yty, n = n, L = 10, estimate_residual_variance = FALSE, residual_variance = 1.0, estimate_prior_method = "EM" ) compare_to_reference("susie_ss", args, tolerance = 1e-5, ref_func_name = "susie_suff_stat") }) test_that("susie_ss() matches reference with estimate_residual_variance=FALSE - simple", { skip_if_no_reference() set.seed(5) n <- 100 p <- 50 X <- matrix(rnorm(n * p), n, p) beta <- rep(0, p) beta[1:4] <- c(2, 3, -2, 1.5) y <- as.vector(X %*% beta + rnorm(n)) X_centered <- scale(X, center = TRUE, scale = FALSE) y_centered <- y - mean(y) XtX <- crossprod(X_centered) Xty <- crossprod(X_centered, y_centered) yty <- sum(y_centered^2) args <- list( XtX = XtX, Xty = Xty, yty = yty, n = n, L = 10, estimate_residual_variance = FALSE, residual_variance = 1.0, estimate_prior_method = "simple" ) compare_to_reference("susie_ss", args, tolerance = 1e-5, ref_func_name = "susie_suff_stat") }) # ============================================================================= # Part 6: Different L values # ============================================================================= test_that("susie_ss() matches reference with different L values - optim", { skip_if_no_reference() set.seed(6) n <- 100 p <- 50 X <- matrix(rnorm(n * p), n, p) beta <- rep(0, p) beta[1:4] <- c(2, 3, -2, 1.5) y <- as.vector(X %*% beta + rnorm(n)) X_centered <- scale(X, center = TRUE, scale = FALSE) y_centered <- y - mean(y) XtX <- crossprod(X_centered) Xty <- crossprod(X_centered, y_centered) yty <- sum(y_centered^2) # Test L=1 args1 <- list(XtX = XtX, Xty = Xty, yty = yty, n = n, L = 1, estimate_prior_method = "optim") compare_to_reference("susie_ss", args1, tolerance = 1e-5, ref_func_name = "susie_suff_stat") # Test L=5 args5 <- list(XtX = XtX, Xty = Xty, yty = yty, n = n, L = 5, estimate_prior_method = "optim") compare_to_reference("susie_ss", args5, tolerance = 1e-5, 
ref_func_name = "susie_suff_stat") # Test L=20 args20 <- list(XtX = XtX, Xty = Xty, yty = yty, n = n, L = 20, estimate_prior_method = "optim") compare_to_reference("susie_ss", args20, tolerance = 1e-5, ref_func_name = "susie_suff_stat") }) test_that("susie_ss() matches reference with different L values - EM", { skip_if_no_reference() set.seed(6) n <- 100 p <- 50 X <- matrix(rnorm(n * p), n, p) beta <- rep(0, p) beta[1:4] <- c(2, 3, -2, 1.5) y <- as.vector(X %*% beta + rnorm(n)) X_centered <- scale(X, center = TRUE, scale = FALSE) y_centered <- y - mean(y) XtX <- crossprod(X_centered) Xty <- crossprod(X_centered, y_centered) yty <- sum(y_centered^2) # Test L=1 args1 <- list(XtX = XtX, Xty = Xty, yty = yty, n = n, L = 1, estimate_prior_method = "EM") compare_to_reference("susie_ss", args1, tolerance = 1e-5, ref_func_name = "susie_suff_stat") # Test L=5 args5 <- list(XtX = XtX, Xty = Xty, yty = yty, n = n, L = 5, estimate_prior_method = "EM") compare_to_reference("susie_ss", args5, tolerance = 1e-5, ref_func_name = "susie_suff_stat") # Test L=20 args20 <- list(XtX = XtX, Xty = Xty, yty = yty, n = n, L = 20, estimate_prior_method = "EM") compare_to_reference("susie_ss", args20, tolerance = 1e-5, ref_func_name = "susie_suff_stat") }) test_that("susie_ss() matches reference with different L values - simple", { skip_if_no_reference() set.seed(6) n <- 100 p <- 50 X <- matrix(rnorm(n * p), n, p) beta <- rep(0, p) beta[1:4] <- c(2, 3, -2, 1.5) y <- as.vector(X %*% beta + rnorm(n)) X_centered <- scale(X, center = TRUE, scale = FALSE) y_centered <- y - mean(y) XtX <- crossprod(X_centered) Xty <- crossprod(X_centered, y_centered) yty <- sum(y_centered^2) # Test L=1 args1 <- list(XtX = XtX, Xty = Xty, yty = yty, n = n, L = 1, estimate_prior_method = "simple") compare_to_reference("susie_ss", args1, tolerance = 1e-5, ref_func_name = "susie_suff_stat") # Test L=5 args5 <- list(XtX = XtX, Xty = Xty, yty = yty, n = n, L = 5, estimate_prior_method = "simple") 
compare_to_reference("susie_ss", args5, tolerance = 1e-5,
                       ref_func_name = "susie_suff_stat")

  # Test L=20
  args20 <- list(XtX = XtX, Xty = Xty, yty = yty, n = n, L = 20,
                 estimate_prior_method = "simple")
  compare_to_reference("susie_ss", args20, tolerance = 1e-5,
                       ref_func_name = "susie_suff_stat")
})

# =============================================================================
# Part 7: prior_weights
# =============================================================================

test_that("susie_ss() matches reference with prior_weights - optim", {
  skip_if_no_reference()
  set.seed(7)
  n <- 100
  p <- 50
  X <- matrix(rnorm(n * p), n, p)
  beta <- rep(0, p)
  beta[1:4] <- c(2, 3, -2, 1.5)
  y <- as.vector(X %*% beta + rnorm(n))
  X_centered <- scale(X, center = TRUE, scale = FALSE)
  y_centered <- y - mean(y)
  XtX <- crossprod(X_centered)
  Xty <- crossprod(X_centered, y_centered)
  yty <- sum(y_centered^2)

  # Use non-uniform prior weights
  prior_weights <- runif(p)
  prior_weights <- prior_weights / sum(prior_weights)

  args <- list(XtX = XtX, Xty = Xty, yty = yty, n = n, L = 10,
               prior_weights = prior_weights,
               estimate_prior_method = "optim")
  compare_to_reference("susie_ss", args, tolerance = 1e-5,
                       ref_func_name = "susie_suff_stat")
})

test_that("susie_ss() matches reference with prior_weights - EM", {
  skip_if_no_reference()
  set.seed(7)
  n <- 100
  p <- 50
  X <- matrix(rnorm(n * p), n, p)
  beta <- rep(0, p)
  beta[1:4] <- c(2, 3, -2, 1.5)
  y <- as.vector(X %*% beta + rnorm(n))
  X_centered <- scale(X, center = TRUE, scale = FALSE)
  y_centered <- y - mean(y)
  XtX <- crossprod(X_centered)
  Xty <- crossprod(X_centered, y_centered)
  yty <- sum(y_centered^2)

  # Use non-uniform prior weights
  prior_weights <- runif(p)
  prior_weights <- prior_weights / sum(prior_weights)

  args <- list(XtX = XtX, Xty = Xty, yty = yty, n = n, L = 10,
               prior_weights = prior_weights,
               estimate_prior_method = "EM")
  compare_to_reference("susie_ss", args, tolerance = 1e-5,
                       ref_func_name = "susie_suff_stat")
})

test_that("susie_ss() matches reference with prior_weights - simple", {
  skip_if_no_reference()
  set.seed(7)
  n <- 100
  p <- 50
  X <- matrix(rnorm(n * p), n, p)
  beta <- rep(0, p)
  beta[1:4] <- c(2, 3, -2, 1.5)
  y <- as.vector(X %*% beta + rnorm(n))
  X_centered <- scale(X, center = TRUE, scale = FALSE)
  y_centered <- y - mean(y)
  XtX <- crossprod(X_centered)
  Xty <- crossprod(X_centered, y_centered)
  yty <- sum(y_centered^2)

  # Use non-uniform prior weights
  prior_weights <- runif(p)
  prior_weights <- prior_weights / sum(prior_weights)

  args <- list(XtX = XtX, Xty = Xty, yty = yty, n = n, L = 10,
               prior_weights = prior_weights,
               estimate_prior_method = "simple")
  compare_to_reference("susie_ss", args, tolerance = 1e-5,
                       ref_func_name = "susie_suff_stat")
})

# =============================================================================
# Part 8: scaled_prior_variance
# =============================================================================

test_that("susie_ss() matches reference with scaled_prior_variance - optim", {
  skip_if_no_reference()
  set.seed(8)
  n <- 100
  p <- 50
  X <- matrix(rnorm(n * p), n, p)
  beta <- rep(0, p)
  beta[1:4] <- c(2, 3, -2, 1.5)
  y <- as.vector(X %*% beta + rnorm(n))
  X_centered <- scale(X, center = TRUE, scale = FALSE)
  y_centered <- y - mean(y)
  XtX <- crossprod(X_centered)
  Xty <- crossprod(X_centered, y_centered)
  yty <- sum(y_centered^2)

  args <- list(XtX = XtX, Xty = Xty, yty = yty, n = n, L = 10,
               scaled_prior_variance = 0.5,
               estimate_prior_method = "optim")
  compare_to_reference("susie_ss", args, tolerance = 1e-5,
                       ref_func_name = "susie_suff_stat")
})

test_that("susie_ss() matches reference with scaled_prior_variance - EM", {
  skip_if_no_reference()
  set.seed(8)
  n <- 100
  p <- 50
  X <- matrix(rnorm(n * p), n, p)
  beta <- rep(0, p)
  beta[1:4] <- c(2, 3, -2, 1.5)
  y <- as.vector(X %*% beta + rnorm(n))
  X_centered <- scale(X, center = TRUE, scale = FALSE)
  y_centered <- y - mean(y)
  XtX <- crossprod(X_centered)
  Xty <- crossprod(X_centered, y_centered)
  yty <- sum(y_centered^2)

  args <- list(XtX = XtX, Xty = Xty, yty = yty, n = n, L = 10,
               scaled_prior_variance = 0.5,
               estimate_prior_method = "EM")
  compare_to_reference("susie_ss", args, tolerance = 1e-5,
                       ref_func_name = "susie_suff_stat")
})

test_that("susie_ss() matches reference with scaled_prior_variance - simple", {
  skip_if_no_reference()
  set.seed(8)
  n <- 100
  p <- 50
  X <- matrix(rnorm(n * p), n, p)
  beta <- rep(0, p)
  beta[1:4] <- c(2, 3, -2, 1.5)
  y <- as.vector(X %*% beta + rnorm(n))
  X_centered <- scale(X, center = TRUE, scale = FALSE)
  y_centered <- y - mean(y)
  XtX <- crossprod(X_centered)
  Xty <- crossprod(X_centered, y_centered)
  yty <- sum(y_centered^2)

  args <- list(XtX = XtX, Xty = Xty, yty = yty, n = n, L = 10,
               scaled_prior_variance = 0.5,
               estimate_prior_method = "simple")
  compare_to_reference("susie_ss", args, tolerance = 1e-5,
                       ref_func_name = "susie_suff_stat")
})

# =============================================================================
# Part 9: coverage, min_abs_corr, and n_purity
# =============================================================================

test_that("susie_ss() matches reference with coverage=0.99 - optim", {
  skip_if_no_reference()
  set.seed(9)
  n <- 100
  p <- 50
  X <- matrix(rnorm(n * p), n, p)
  beta <- rep(0, p)
  beta[1:4] <- c(2, 3, -2, 1.5)
  y <- as.vector(X %*% beta + rnorm(n))
  X_centered <- scale(X, center = TRUE, scale = FALSE)
  y_centered <- y - mean(y)
  XtX <- crossprod(X_centered)
  Xty <- crossprod(X_centered, y_centered)
  yty <- sum(y_centered^2)

  args <- list(XtX = XtX, Xty = Xty, yty = yty, n = n, L = 10,
               coverage = 0.99,
               estimate_prior_method = "optim")
  compare_to_reference("susie_ss", args, tolerance = 1e-5,
                       ref_func_name = "susie_suff_stat")
})

test_that("susie_ss() matches reference with coverage=0.99 - EM", {
  skip_if_no_reference()
  set.seed(9)
  n <- 100
  p <- 50
  X <- matrix(rnorm(n * p), n, p)
  beta <- rep(0, p)
  beta[1:4] <- c(2, 3, -2, 1.5)
  y <- as.vector(X %*% beta + rnorm(n))
  X_centered <- scale(X, center = TRUE, scale = FALSE)
  y_centered <- y - mean(y)
  XtX <-
crossprod(X_centered)
  Xty <- crossprod(X_centered, y_centered)
  yty <- sum(y_centered^2)

  args <- list(XtX = XtX, Xty = Xty, yty = yty, n = n, L = 10,
               coverage = 0.99,
               estimate_prior_method = "EM")
  compare_to_reference("susie_ss", args, tolerance = 1e-5,
                       ref_func_name = "susie_suff_stat")
})

test_that("susie_ss() matches reference with coverage=0.99 - simple", {
  skip_if_no_reference()
  set.seed(9)
  n <- 100
  p <- 50
  X <- matrix(rnorm(n * p), n, p)
  beta <- rep(0, p)
  beta[1:4] <- c(2, 3, -2, 1.5)
  y <- as.vector(X %*% beta + rnorm(n))
  X_centered <- scale(X, center = TRUE, scale = FALSE)
  y_centered <- y - mean(y)
  XtX <- crossprod(X_centered)
  Xty <- crossprod(X_centered, y_centered)
  yty <- sum(y_centered^2)

  args <- list(XtX = XtX, Xty = Xty, yty = yty, n = n, L = 10,
               coverage = 0.99,
               estimate_prior_method = "simple")
  compare_to_reference("susie_ss", args, tolerance = 1e-5,
                       ref_func_name = "susie_suff_stat")
})

test_that("susie_ss() matches reference with min_abs_corr=0.7 - optim", {
  skip_if_no_reference()
  set.seed(10)
  n <- 100
  p <- 50
  X <- matrix(rnorm(n * p), n, p)
  beta <- rep(0, p)
  beta[1:4] <- c(2, 3, -2, 1.5)
  y <- as.vector(X %*% beta + rnorm(n))
  X_centered <- scale(X, center = TRUE, scale = FALSE)
  y_centered <- y - mean(y)
  XtX <- crossprod(X_centered)
  Xty <- crossprod(X_centered, y_centered)
  yty <- sum(y_centered^2)

  args <- list(XtX = XtX, Xty = Xty, yty = yty, n = n, L = 10,
               min_abs_corr = 0.7,
               estimate_prior_method = "optim")
  compare_to_reference("susie_ss", args, tolerance = 1e-5,
                       ref_func_name = "susie_suff_stat")
})

test_that("susie_ss() matches reference with min_abs_corr=0.7 - EM", {
  skip_if_no_reference()
  set.seed(10)
  n <- 100
  p <- 50
  X <- matrix(rnorm(n * p), n, p)
  beta <- rep(0, p)
  beta[1:4] <- c(2, 3, -2, 1.5)
  y <- as.vector(X %*% beta + rnorm(n))
  X_centered <- scale(X, center = TRUE, scale = FALSE)
  y_centered <- y - mean(y)
  XtX <- crossprod(X_centered)
  Xty <- crossprod(X_centered, y_centered)
  yty <- sum(y_centered^2)

  args <- list(XtX = XtX, Xty = Xty, yty = yty, n = n, L = 10,
               min_abs_corr = 0.7,
               estimate_prior_method = "EM")
  compare_to_reference("susie_ss", args, tolerance = 1e-5,
                       ref_func_name = "susie_suff_stat")
})

test_that("susie_ss() matches reference with min_abs_corr=0.7 - simple", {
  skip_if_no_reference()
  set.seed(10)
  n <- 100
  p <- 50
  X <- matrix(rnorm(n * p), n, p)
  beta <- rep(0, p)
  beta[1:4] <- c(2, 3, -2, 1.5)
  y <- as.vector(X %*% beta + rnorm(n))
  X_centered <- scale(X, center = TRUE, scale = FALSE)
  y_centered <- y - mean(y)
  XtX <- crossprod(X_centered)
  Xty <- crossprod(X_centered, y_centered)
  yty <- sum(y_centered^2)

  args <- list(XtX = XtX, Xty = Xty, yty = yty, n = n, L = 10,
               min_abs_corr = 0.7,
               estimate_prior_method = "simple")
  compare_to_reference("susie_ss", args, tolerance = 1e-5,
                       ref_func_name = "susie_suff_stat")
})

test_that("susie_ss() matches reference with n_purity=3 - optim", {
  skip_if_no_reference()
  set.seed(11)
  n <- 100
  p <- 50
  X <- matrix(rnorm(n * p), n, p)
  beta <- rep(0, p)
  beta[1:4] <- c(2, 3, -2, 1.5)
  y <- as.vector(X %*% beta + rnorm(n))
  X_centered <- scale(X, center = TRUE, scale = FALSE)
  y_centered <- y - mean(y)
  XtX <- crossprod(X_centered)
  Xty <- crossprod(X_centered, y_centered)
  yty <- sum(y_centered^2)

  # Set seed before calling to ensure same variant selection
  set.seed(999)
  args <- list(XtX = XtX, Xty = Xty, yty = yty, n = n, L = 10,
               n_purity = 3,
               estimate_prior_method = "optim")
  compare_to_reference("susie_ss", args, tolerance = 1e-5,
                       ref_func_name = "susie_suff_stat")
})

test_that("susie_ss() matches reference with n_purity=3 - EM", {
  skip_if_no_reference()
  set.seed(11)
  n <- 100
  p <- 50
  X <- matrix(rnorm(n * p), n, p)
  beta <- rep(0, p)
  beta[1:4] <- c(2, 3, -2, 1.5)
  y <- as.vector(X %*% beta + rnorm(n))
  X_centered <- scale(X, center = TRUE, scale = FALSE)
  y_centered <- y - mean(y)
  XtX <- crossprod(X_centered)
  Xty <- crossprod(X_centered, y_centered)
  yty <- sum(y_centered^2)

  # Set seed before calling to ensure same variant selection
  set.seed(999)
  args <- list(XtX = XtX, Xty = Xty, yty = yty, n = n, L = 10,
               n_purity = 3,
               estimate_prior_method = "EM")
  compare_to_reference("susie_ss", args, tolerance = 1e-5,
                       ref_func_name = "susie_suff_stat")
})

test_that("susie_ss() matches reference with n_purity=3 - simple", {
  skip_if_no_reference()
  set.seed(11)
  n <- 100
  p <- 50
  X <- matrix(rnorm(n * p), n, p)
  beta <- rep(0, p)
  beta[1:4] <- c(2, 3, -2, 1.5)
  y <- as.vector(X %*% beta + rnorm(n))
  X_centered <- scale(X, center = TRUE, scale = FALSE)
  y_centered <- y - mean(y)
  XtX <- crossprod(X_centered)
  Xty <- crossprod(X_centered, y_centered)
  yty <- sum(y_centered^2)

  # Set seed before calling to ensure same variant selection
  set.seed(999)
  args <- list(XtX = XtX, Xty = Xty, yty = yty, n = n, L = 10,
               n_purity = 3,
               estimate_prior_method = "simple")
  compare_to_reference("susie_ss", args, tolerance = 1e-5,
                       ref_func_name = "susie_suff_stat")
})

# =============================================================================
# Part 10: Combined parameter variations
# =============================================================================

test_that("susie_ss() matches reference with combined parameters - optim", {
  skip_if_no_reference()
  set.seed(11)
  n <- 100
  p <- 50
  X <- matrix(rnorm(n * p), n, p)
  beta <- rep(0, p)
  beta[1:4] <- c(2, 3, -2, 1.5)
  y <- as.vector(X %*% beta + rnorm(n))
  X_centered <- scale(X, center = TRUE, scale = FALSE)
  y_centered <- y - mean(y)
  XtX <- crossprod(X_centered)
  Xty <- crossprod(X_centered, y_centered)
  yty <- sum(y_centered^2)

  # Test combination: standardize=FALSE, estimate_prior_variance=FALSE
  args1 <- list(XtX = XtX, Xty = Xty, yty = yty, n = n, L = 10,
                standardize = FALSE,
                estimate_prior_variance = FALSE,
                estimate_prior_method = "optim")
  compare_to_reference("susie_ss", args1, tolerance = 1e-5,
                       ref_func_name = "susie_suff_stat")

  # Test combination: estimate_prior_variance=FALSE, estimate_residual_variance=FALSE
  args2 <- list(XtX = XtX, Xty = Xty, yty = yty, n = n, L = 10,
                estimate_prior_variance = FALSE,
estimate_residual_variance = FALSE, residual_variance = 1.0,
                estimate_prior_method = "optim")
  compare_to_reference("susie_ss", args2, tolerance = 1e-5,
                       ref_func_name = "susie_suff_stat")
})

test_that("susie_ss() matches reference with combined parameters - EM", {
  skip_if_no_reference()
  set.seed(11)
  n <- 100
  p <- 50
  X <- matrix(rnorm(n * p), n, p)
  beta <- rep(0, p)
  beta[1:4] <- c(2, 3, -2, 1.5)
  y <- as.vector(X %*% beta + rnorm(n))
  X_centered <- scale(X, center = TRUE, scale = FALSE)
  y_centered <- y - mean(y)
  XtX <- crossprod(X_centered)
  Xty <- crossprod(X_centered, y_centered)
  yty <- sum(y_centered^2)

  # Test combination: standardize=FALSE, estimate_prior_variance=FALSE
  args1 <- list(XtX = XtX, Xty = Xty, yty = yty, n = n, L = 10,
                standardize = FALSE,
                estimate_prior_variance = FALSE,
                estimate_prior_method = "EM")
  compare_to_reference("susie_ss", args1, tolerance = 1e-5,
                       ref_func_name = "susie_suff_stat")

  # Test combination: estimate_prior_variance=FALSE, estimate_residual_variance=FALSE
  args2 <- list(XtX = XtX, Xty = Xty, yty = yty, n = n, L = 10,
                estimate_prior_variance = FALSE,
                estimate_residual_variance = FALSE, residual_variance = 1.0,
                estimate_prior_method = "EM")
  compare_to_reference("susie_ss", args2, tolerance = 1e-5,
                       ref_func_name = "susie_suff_stat")
})

test_that("susie_ss() matches reference with combined parameters - simple", {
  skip_if_no_reference()
  set.seed(11)
  n <- 100
  p <- 50
  X <- matrix(rnorm(n * p), n, p)
  beta <- rep(0, p)
  beta[1:4] <- c(2, 3, -2, 1.5)
  y <- as.vector(X %*% beta + rnorm(n))
  X_centered <- scale(X, center = TRUE, scale = FALSE)
  y_centered <- y - mean(y)
  XtX <- crossprod(X_centered)
  Xty <- crossprod(X_centered, y_centered)
  yty <- sum(y_centered^2)

  # Test combination: standardize=FALSE, estimate_prior_variance=FALSE
  args1 <- list(XtX = XtX, Xty = Xty, yty = yty, n = n, L = 10,
                standardize = FALSE,
                estimate_prior_variance = FALSE,
                estimate_prior_method = "simple")
  compare_to_reference("susie_ss", args1, tolerance = 1e-5,
                       ref_func_name = "susie_suff_stat")

  # Test combination: estimate_prior_variance=FALSE, estimate_residual_variance=FALSE
  args2 <- list(XtX = XtX, Xty = Xty, yty = yty, n = n, L = 10,
                estimate_prior_variance = FALSE,
                estimate_residual_variance = FALSE, residual_variance = 1.0,
                estimate_prior_method = "simple")
  compare_to_reference("susie_ss", args2, tolerance = 1e-5,
                       ref_func_name = "susie_suff_stat")
})

# =============================================================================
# Part 11: prior_tol parameter
# =============================================================================

# NOTE(review): this test previously claimed "prior_tol=1e-5" in its name,
# but it has always set prior_tol = 0.1 (matching the EM and simple variants
# below). Renamed so the name agrees with the argument actually tested.
test_that("susie_ss() matches reference with prior_tol=0.1 - optim", {
  skip_if_no_reference()
  set.seed(12)
  n <- 100
  p <- 50
  X <- matrix(rnorm(n * p), n, p)
  beta <- rep(0, p)
  beta[1:4] <- c(2, 3, -2, 1.5)
  y <- as.vector(X %*% beta + rnorm(n))
  X_centered <- scale(X, center = TRUE, scale = FALSE)
  y_centered <- y - mean(y)
  XtX <- crossprod(X_centered)
  Xty <- crossprod(X_centered, y_centered)
  yty <- sum(y_centered^2)

  args <- list(XtX = XtX, Xty = Xty, yty = yty, n = n, L = 10,
               prior_tol = 0.1,
               estimate_prior_method = "optim")
  compare_to_reference("susie_ss", args, tolerance = 1e-5,
                       ref_func_name = "susie_suff_stat")
})

test_that("susie_ss() matches reference with prior_tol=0.1 - EM", {
  skip("Intentional change: susieR2.0 adds a post-convergence trim_null_effects() pass that zeros model$V entries where V < prior_tol. The reference uses prior_tol only to filter PIPs; it never zeros V. Triggers a V / alpha / mu divergence above 1e-5.")
  skip_if_no_reference()
  set.seed(12)
  n <- 100
  p <- 50
  X <- matrix(rnorm(n * p), n, p)
  beta <- rep(0, p)
  beta[1:4] <- c(2, 3, -2, 1.5)
  y <- as.vector(X %*% beta + rnorm(n))
  X_centered <- scale(X, center = TRUE, scale = FALSE)
  y_centered <- y - mean(y)
  XtX <- crossprod(X_centered)
  Xty <- crossprod(X_centered, y_centered)
  yty <- sum(y_centered^2)

  args <- list(XtX = XtX, Xty = Xty, yty = yty, n = n, L = 10,
               prior_tol = 0.1,
               estimate_prior_method = "EM")
  compare_to_reference("susie_ss", args, tolerance = 1e-5,
                       ref_func_name = "susie_suff_stat")
})

test_that("susie_ss() matches reference with prior_tol=0.1 - simple", {
  skip_if_no_reference()
  set.seed(12)
  n <- 100
  p <- 50
  X <- matrix(rnorm(n * p), n, p)
  beta <- rep(0, p)
  beta[1:4] <- c(2, 3, -2, 1.5)
  y <- as.vector(X %*% beta + rnorm(n))
  X_centered <- scale(X, center = TRUE, scale = FALSE)
  y_centered <- y - mean(y)
  XtX <- crossprod(X_centered)
  Xty <- crossprod(X_centered, y_centered)
  yty <- sum(y_centered^2)

  args <- list(XtX = XtX, Xty = Xty, yty = yty, n = n, L = 10,
               prior_tol = 0.1,
               estimate_prior_method = "simple")
  compare_to_reference("susie_ss", args, tolerance = 1e-5,
                       ref_func_name = "susie_suff_stat")
})

# =============================================================================
# Part 12: check_null_threshold parameter
# =============================================================================

test_that("susie_ss() matches reference with check_null_threshold=0.1 - optim", {
  skip_if_no_reference()
  set.seed(13)
  n <- 100
  p <- 50
  X <- matrix(rnorm(n * p), n, p)
  beta <- rep(0, p)
  beta[1:4] <- c(2, 3, -2, 1.5)
  y <- as.vector(X %*% beta + rnorm(n))
  X_centered <- scale(X, center = TRUE, scale = FALSE)
  y_centered <- y - mean(y)
  XtX <- crossprod(X_centered)
  Xty <- crossprod(X_centered, y_centered)
  yty <- sum(y_centered^2)

  args <- list(XtX = XtX, Xty = Xty, yty = yty, n = n, L = 10,
               check_null_threshold = 0.1,
               estimate_prior_method = "optim")
compare_to_reference("susie_ss", args, tolerance = 1e-5,
                       ref_func_name = "susie_suff_stat")
})

test_that("susie_ss() matches reference with check_null_threshold=0.1 - EM", {
  skip("Not a bug: susieR2.0 intentionally skips the check_null_threshold V-zeroing step for EM (see R/single_effect_regression.R:169 and stephenslab/mvsusieR#26). The check would zero V without recomputing the posterior, creating an inconsistent (q, V) pair that can decrease the ELBO. Since dev ignores check_null_threshold for EM, this test cannot match a reference that always applies the check.")
  skip_if_no_reference()
  set.seed(13)
  n <- 100
  p <- 50
  X <- matrix(rnorm(n * p), n, p)
  beta <- rep(0, p)
  beta[1:4] <- c(2, 3, -2, 1.5)
  y <- as.vector(X %*% beta + rnorm(n))
  X_centered <- scale(X, center = TRUE, scale = FALSE)
  y_centered <- y - mean(y)
  XtX <- crossprod(X_centered)
  Xty <- crossprod(X_centered, y_centered)
  yty <- sum(y_centered^2)

  args <- list(XtX = XtX, Xty = Xty, yty = yty, n = n, L = 10,
               check_null_threshold = 0.1,
               estimate_prior_method = "EM")
  compare_to_reference("susie_ss", args, tolerance = 1e-5,
                       ref_func_name = "susie_suff_stat")
})

test_that("susie_ss() matches reference with check_null_threshold=0.1 - simple", {
  skip_if_no_reference()
  set.seed(13)
  n <- 100
  p <- 50
  X <- matrix(rnorm(n * p), n, p)
  beta <- rep(0, p)
  beta[1:4] <- c(2, 3, -2, 1.5)
  y <- as.vector(X %*% beta + rnorm(n))
  X_centered <- scale(X, center = TRUE, scale = FALSE)
  y_centered <- y - mean(y)
  XtX <- crossprod(X_centered)
  Xty <- crossprod(X_centered, y_centered)
  yty <- sum(y_centered^2)

  args <- list(XtX = XtX, Xty = Xty, yty = yty, n = n, L = 10,
               check_null_threshold = 0.1,
               estimate_prior_method = "simple")
  compare_to_reference("susie_ss", args, tolerance = 1e-5,
                       ref_func_name = "susie_suff_stat")
})

# =============================================================================
# Part 13: maf and maf_thresh parameters
# =============================================================================
test_that("susie_ss() matches reference with maf filtering - optim", {
  skip_if_no_reference()
  set.seed(14)
  n <- 100
  p <- 50
  X <- matrix(rnorm(n * p), n, p)
  beta <- rep(0, p)
  beta[1:4] <- c(2, 3, -2, 1.5)
  y <- as.vector(X %*% beta + rnorm(n))
  X_centered <- scale(X, center = TRUE, scale = FALSE)
  y_centered <- y - mean(y)
  XtX <- crossprod(X_centered)
  Xty <- crossprod(X_centered, y_centered)
  yty <- sum(y_centered^2)

  # Simulate minor allele frequencies
  maf <- runif(p, 0.05, 0.5)

  args <- list(XtX = XtX, Xty = Xty, yty = yty, n = n, L = 10,
               maf = maf, maf_thresh = 0.1,
               estimate_prior_method = "optim")
  compare_to_reference("susie_ss", args, tolerance = 1e-5,
                       ref_func_name = "susie_suff_stat")
})

test_that("susie_ss() matches reference with maf filtering - EM", {
  skip_if_no_reference()
  set.seed(14)
  n <- 100
  p <- 50
  X <- matrix(rnorm(n * p), n, p)
  beta <- rep(0, p)
  beta[1:4] <- c(2, 3, -2, 1.5)
  y <- as.vector(X %*% beta + rnorm(n))
  X_centered <- scale(X, center = TRUE, scale = FALSE)
  y_centered <- y - mean(y)
  XtX <- crossprod(X_centered)
  Xty <- crossprod(X_centered, y_centered)
  yty <- sum(y_centered^2)

  # Simulate minor allele frequencies
  maf <- runif(p, 0.05, 0.5)

  args <- list(XtX = XtX, Xty = Xty, yty = yty, n = n, L = 10,
               maf = maf, maf_thresh = 0.1,
               estimate_prior_method = "EM")
  compare_to_reference("susie_ss", args, tolerance = 1e-5,
                       ref_func_name = "susie_suff_stat")
})

test_that("susie_ss() matches reference with maf filtering - simple", {
  skip_if_no_reference()
  set.seed(14)
  n <- 100
  p <- 50
  X <- matrix(rnorm(n * p), n, p)
  beta <- rep(0, p)
  beta[1:4] <- c(2, 3, -2, 1.5)
  y <- as.vector(X %*% beta + rnorm(n))
  X_centered <- scale(X, center = TRUE, scale = FALSE)
  y_centered <- y - mean(y)
  XtX <- crossprod(X_centered)
  Xty <- crossprod(X_centered, y_centered)
  yty <- sum(y_centered^2)

  # Simulate minor allele frequencies
  maf <- runif(p, 0.05, 0.5)

  args <- list(XtX = XtX, Xty = Xty, yty = yty, n = n, L = 10,
               maf = maf, maf_thresh = 0.1,
               estimate_prior_method = "simple")
  compare_to_reference("susie_ss", args, tolerance = 1e-5,
                       ref_func_name = "susie_suff_stat")
})


================================================
FILE: tests/testthat/test_X_centering.R
================================================
# Test that susie_rss gives equivalent results for raw, centered,
# and standardized X inputs.

context("X centering equivalence")

test_that("Full-rank X: raw, centered, standardized give same results", {
  set.seed(1)
  n <- 200
  p <- 50

  # Generate X with non-zero column means (raw)
  X_raw <- matrix(rnorm(n * p, mean = 5, sd = 2), n, p)
  X_raw[, 1:3] <- X_raw[, 1:3] + 10  # make some columns have large means

  # Centered and standardized versions
  X_centered <- scale(X_raw, center = TRUE, scale = FALSE)
  X_standardized <- scale(X_raw, center = TRUE, scale = TRUE)

  # Generate z-scores from centered X
  beta_true <- rep(0, p)
  beta_true[c(5, 15, 30)] <- c(0.5, -0.3, 0.4)
  y <- X_centered %*% beta_true + rnorm(n)
  z <- as.vector(sqrt(n) * cor(X_centered, y))

  # Fit with all three forms of X (full-rank path: nrow >= ncol)
  fit_raw <- susie_rss(z = z, X = X_raw, n = n, max_iter = 50)
  fit_cent <- susie_rss(z = z, X = X_centered, n = n, max_iter = 50)
  fit_std <- susie_rss(z = z, X = X_standardized, n = n, max_iter = 50)

  # All should produce identical results (full-rank path uses safe_cor
  # which centers internally, but we also center before calling safe_cor)
  expect_equal(fit_raw$elbo, fit_cent$elbo, tolerance = 1e-10)
  expect_equal(fit_raw$elbo, fit_std$elbo, tolerance = 1e-10)
  expect_equal(fit_raw$pip, fit_cent$pip, tolerance = 1e-10)
  expect_equal(fit_raw$pip, fit_std$pip, tolerance = 1e-10)
})

test_that("Low-rank X: raw and centered give identical results", {
  set.seed(2)
  n <- 200
  p <- 500
  B <- 100  # reference factor rows < p, triggers low-rank path

  # Generate full X and z-scores
  X_full <- matrix(rnorm(n * p), n, p)
  beta_true <- rep(0, p)
  beta_true[c(10, 50, 200)] <- c(0.5, -0.3, 0.4)
  y <- X_full %*% beta_true + rnorm(n)
  z <- as.vector(sqrt(n) * cor(X_full, y))

  # Create a reference factor matrix (B x p, B < p)
  S <- matrix(rnorm(B * n) / sqrt(B), B, n)
  X_ref <- S %*% X_full  # B x p reference factor

  # Add offset to create "raw" version with non-zero column means
  X_ref_raw <- X_ref + 10

  # Manually center (avoid scale() attributes)
  X_ref_centered <- X_ref_raw - rep(colMeans(X_ref_raw), each = B)

  # Fit with both forms (low-rank path: nrow < ncol)
  fit_raw <- susie_rss(z = z, X = X_ref_raw, n = n, L = 5, max_iter = 50)
  fit_cent <- susie_rss(z = z, X = X_ref_centered, n = n, L = 5, max_iter = 50)

  # Raw and centered should give identical results
  expect_equal(fit_raw$elbo, fit_cent$elbo, tolerance = 1e-10)
  expect_equal(fit_raw$pip, fit_cent$pip, tolerance = 1e-10)
})

test_that("Low-rank X: raw vs centered give same results (no n)", {
  set.seed(3)
  p <- 300
  B <- 80

  # Generate reference factor matrix with non-zero means
  X_raw <- matrix(rnorm(B * p, mean = 3), B, p)
  X_centered <- X_raw - rep(colMeans(X_raw), each = B)

  z <- rnorm(p)
  z[c(5, 100)] <- c(4, -3.5)

  fit_raw <- susie_rss(z = z, X = X_raw, L = 5, max_iter = 30)
  fit_cent <- susie_rss(z = z, X = X_centered, L = 5, max_iter = 30)

  expect_equal(fit_raw$elbo, fit_cent$elbo, tolerance = 1e-10)
  expect_equal(fit_raw$pip, fit_cent$pip, tolerance = 1e-10)
})

test_that("Low-rank X with lambda: raw and centered give same results", {
  set.seed(4)
  p <- 200
  B <- 50

  X_raw <- matrix(rnorm(B * p, mean = 2, sd = 3), B, p)
  X_centered <- X_raw - rep(colMeans(X_raw), each = B)

  z <- rnorm(p)
  z[c(10, 80)] <- c(5, -4)

  fit_raw <- susie_rss_lambda(z = z, X = X_raw, lambda = 0.1, L = 5,
                              max_iter = 30)
  fit_cent <- susie_rss_lambda(z = z, X = X_centered, lambda = 0.1, L = 5,
                               max_iter = 30)

  expect_equal(fit_raw$elbo, fit_cent$elbo, tolerance = 1e-10)
  expect_equal(fit_raw$pip, fit_cent$pip, tolerance = 1e-10)
})

test_that("Low-rank X: large offset does not break fitting", {
  # Verify that adding a large constant offset to X columns does not
  # break the fitting (because centering removes it).
set.seed(5)
  p <- 200
  B <- 80

  X_centered <- matrix(rnorm(B * p), B, p)
  X_offset <- X_centered + 1000  # huge offset

  z <- rnorm(p)
  z[c(10, 80)] <- c(5, -4)

  # Both should give identical results
  fit_cent <- susie_rss(z = z, X = X_centered, n = 500, L = 5, max_iter = 50)
  fit_off <- susie_rss(z = z, X = X_offset, n = 500, L = 5, max_iter = 50)

  # Tolerance accounts for floating-point cancellation when subtracting
  # the large offset (1000 * machine_eps ≈ 2e-13, amplified by iterations)
  expect_equal(fit_cent$elbo, fit_off$elbo, tolerance = 1e-6)
  expect_equal(fit_cent$pip, fit_off$pip, tolerance = 1e-6)
})


================================================
FILE: tests/testthat/test_coef_predict.R
================================================
context("coef and predict S3 methods")

# =============================================================================
# COEF.SUSIE - EXTRACT COEFFICIENTS
# =============================================================================

test_that("coef.susie returns correct format", {
  set.seed(1)
  dat <- simulate_regression(n = 100, p = 50, k = 3)
  fit <- susie(dat$X, dat$y, L = 5, verbose = FALSE)
  coefs <- coef(fit)
  expect_length(coefs, dat$p + 1)
  expect_type(coefs, "double")
  expect_named(coefs, NULL)
})

test_that("coef.susie includes intercept as first element", {
  set.seed(2)
  dat <- simulate_regression(n = 100, p = 50, k = 3)
  fit <- susie(dat$X, dat$y, L = 5, verbose = FALSE)
  coefs <- coef(fit)
  expect_equal(coefs[1], fit$intercept)
})

test_that("coef.susie computes coefficients correctly", {
  set.seed(3)
  dat <- simulate_regression(n = 100, p = 50, k = 3)
  fit <- susie(dat$X, dat$y, L = 5, verbose = FALSE)
  coefs <- coef(fit)
  expected <- c(fit$intercept,
                colSums(fit$alpha * fit$mu) / fit$X_column_scale_factors)
  expect_equal(coefs, expected)
})

test_that("coef.susie handles intercept=FALSE", {
  set.seed(4)
  dat <- simulate_regression(n = 100, p = 50, k = 3)
  fit <- susie(dat$X, dat$y, L = 5, intercept = FALSE, verbose = FALSE)
  coefs <- coef(fit)
  expect_equal(coefs[1], 0)
})

test_that("coef.susie handles standardize=FALSE", {
  set.seed(5)
  dat <- simulate_regression(n = 100, p = 50, k = 3, center = FALSE,
                             scale = FALSE)
  fit <- susie(dat$X, dat$y, L = 5, standardize = FALSE, verbose = FALSE)
  coefs <- coef(fit)
  expect_length(coefs, dat$p + 1)
  expect_type(coefs, "double")
})

# =============================================================================
# PREDICT.SUSIE - MAKE PREDICTIONS
# =============================================================================

test_that("predict.susie with type='coefficients' returns coef", {
  set.seed(6)
  dat <- simulate_regression(n = 100, p = 50, k = 3)
  fit <- susie(dat$X, dat$y, L = 5, verbose = FALSE)
  pred_coef <- predict(fit, type = "coefficients")
  expected_coef <- coef(fit)
  expect_equal(pred_coef, expected_coef)
})

test_that("predict.susie with type='coefficients' errors if newx provided", {
  set.seed(7)
  dat <- simulate_regression(n = 100, p = 50, k = 3)
  fit <- susie(dat$X, dat$y, L = 5, verbose = FALSE)
  newx <- matrix(rnorm(10 * 50), 10, 50)
  expect_error(
    predict(fit, newx = newx, type = "coefficients"),
    "Do not supply newx"
  )
})

test_that("predict.susie without newx returns fitted values", {
  set.seed(8)
  dat <- simulate_regression(n = 100, p = 50, k = 3)
  fit <- susie(dat$X, dat$y, L = 5, verbose = FALSE)
  pred <- predict(fit, type = "response")
  expect_equal(pred, fit$fitted)
  expect_length(pred, dat$n)
})

test_that("predict.susie with newx computes predictions correctly", {
  set.seed(9)
  dat <- simulate_regression(n = 100, p = 50, k = 3)
  fit <- susie(dat$X, dat$y, L = 5, verbose = FALSE)
  newx <- matrix(rnorm(20 * 50), 20, 50)
  newx <- scale(newx, center = TRUE, scale = TRUE)
  pred <- predict(fit, newx = newx, type = "response")
  expect_length(pred, 20)
  expect_type(pred, "double")
  coefs <- coef(fit)
  expected <- drop(fit$intercept + newx %*% coefs[-1])
  expect_equal(pred, expected)
})

test_that("predict.susie handles intercept=FALSE with newx", {
  set.seed(10)
  dat <- simulate_regression(n = 100, p = 50, k = 3)
  fit <- susie(dat$X, dat$y, L = 5, intercept = FALSE, verbose = FALSE)
  newx <- matrix(rnorm(20 * 50), 20, 50)
  newx <- scale(newx, center = TRUE, scale = TRUE)
  pred <- predict(fit, newx = newx)
  coefs <- coef(fit)
  expected <- drop(newx %*% coefs[-1])
  expect_equal(pred, expected)
})

test_that("predict.susie with NA intercept warns and uses 0", {
  set.seed(11)
  dat <- simulate_regression(n = 100, p = 50, k = 3)
  ss <- compute_summary_stats(dat$X, dat$y)
  fit <- susie_ss(ss$XtX, ss$Xty, ss$yty, n = ss$n, L = 5, verbose = FALSE)
  expect_true(is.na(fit$intercept))
  newx <- matrix(rnorm(20 * 50), 20, 50)
  newx <- scale(newx, center = TRUE, scale = TRUE)
  expect_message(
    pred <- predict(fit, newx = newx),
    "intercept = 0"
  )
  coefs <- coef(fit)
  expected <- drop(newx %*% coefs[-1])
  expect_equal(pred, expected)
})

test_that("predict.susie default type is response", {
  set.seed(12)
  dat <- simulate_regression(n = 100, p = 50, k = 3)
  fit <- susie(dat$X, dat$y, L = 5, verbose = FALSE)
  pred1 <- predict(fit)
  pred2 <- predict(fit, type = "response")
  expect_equal(pred1, pred2)
})

test_that("predict.susie works with single new observation", {
  set.seed(13)
  dat <- simulate_regression(n = 100, p = 50, k = 3)
  fit <- susie(dat$X, dat$y, L = 5, verbose = FALSE)
  newx <- matrix(rnorm(50), 1, 50)
  newx <- scale(newx, center = TRUE, scale = TRUE)
  pred <- predict(fit, newx = newx)
  expect_length(pred, 1)
  expect_type(pred, "double")
})

test_that("predict.susie handles matrix vs data.frame newx", {
  set.seed(14)
  dat <- simulate_regression(n = 100, p = 50, k = 3)
  fit <- susie(dat$X, dat$y, L = 5, verbose = FALSE)
  newx_mat <- matrix(rnorm(20 * 50), 20, 50)
  newx_mat <- scale(newx_mat, center = TRUE, scale = TRUE)
  newx_df <- as.data.frame(newx_mat)
  pred_mat <- predict(fit, newx = newx_mat)
  pred_df <- predict(fit, newx = as.matrix(newx_df))
  expect_equal(pred_mat, pred_df)
})

# =============================================================================
# INTEGRATION - COEF & PREDICT CONSISTENCY
# =============================================================================

test_that("coef and predict work together consistently", {
  set.seed(15)
  dat <- simulate_regression(n = 100, p = 50, k = 3)
  fit <- susie(dat$X, dat$y, L = 5, verbose = FALSE)
  coefs <- coef(fit)
  newx <- matrix(rnorm(10 * 50), 10, 50)
  newx <- scale(newx, center = TRUE, scale = TRUE)
  pred_via_predict <- predict(fit, newx = newx)
  pred_via_coef <- drop(coefs[1] + newx %*% coefs[-1])
  expect_equal(pred_via_predict, pred_via_coef)
})

test_that("coef.susie with all V=0 returns zero coefficients", {
  set.seed(16)
  dat <- simulate_regression(n = 100, p = 50, k = 3)
  fit <- susie(dat$X, dat$y, L = 5, verbose = FALSE)
  fit$V <- rep(0, 5)
  fit$alpha <- matrix(1/dat$p, 5, dat$p)
  fit$mu <- matrix(0, 5, dat$p)
  coefs <- coef(fit)
  expect_equal(coefs[-1], rep(0, dat$p))
})

test_that("predict.susie with standardize=FALSE", {
  set.seed(17)
  dat <- simulate_regression(n = 100, p = 50, k = 3, center = FALSE,
                             scale = FALSE)
  fit <- susie(dat$X, dat$y, L = 5, standardize = FALSE, verbose = FALSE)
  pred <- predict(fit)
  expect_equal(pred, fit$fitted)
  expect_length(pred, dat$n)
})


================================================
FILE: tests/testthat/test_compute_marginal_bhat_shat.R
================================================
# compute_marginal_bhat_shat
#
# Per-position marginal OLS regression helper. Used by susieR's own
# T = 1 SER path (cosmetic refactor candidate), mvsusieR's OLS
# branch, and mfsusieR's prior init / SER. Three contracts:
#   1. Vector-Y input is treated as a single-column matrix.
#   2. predictor_weights override matches recompute from colSums(X^2).
#   3. sigma2 supplied gives single-effect-residual Shat shape.
# Shared fixture dimensions for all tests in this file; the seed fixes the
# RNG stream so each test's draws are reproducible in sequence.
set.seed(42)
N <- 50
J <- 5

test_that("vector Y is treated as a single-column matrix", {
  X <- matrix(rnorm(N * J), N, J)
  X <- scale(X, center = TRUE, scale = FALSE)
  y <- rnorm(N)
  # A plain vector y and the equivalent N x 1 matrix must give byte-identical
  # results (tolerance = 0 requests an exact comparison).
  out_vec <- compute_marginal_bhat_shat(X, y)
  out_mat <- compute_marginal_bhat_shat(X, matrix(y, ncol = 1))
  expect_equal(dim(out_vec$Bhat), c(J, 1L))
  expect_equal(dim(out_vec$Shat), c(J, 1L))
  expect_equal(out_vec$Bhat, out_mat$Bhat, tolerance = 0)
  expect_equal(out_vec$Shat, out_mat$Shat, tolerance = 0)
})

test_that("matrix Y returns J x T Bhat / Shat", {
  X <- matrix(rnorm(N * J), N, J)
  X <- scale(X, center = TRUE, scale = FALSE)
  Y <- matrix(rnorm(N * 3), N, 3)
  out <- compute_marginal_bhat_shat(X, Y)
  # One column of estimates per outcome column (T = 3 here).
  expect_equal(dim(out$Bhat), c(J, 3L))
  expect_equal(dim(out$Shat), c(J, 3L))
})

test_that("predictor_weights override matches recompute from colSums(X^2)", {
  X <- matrix(rnorm(N * J), N, J)
  X <- scale(X, center = TRUE, scale = FALSE)
  Y <- matrix(rnorm(N * 4), N, 4)
  # Passing the same weights the function would compute itself must be a
  # no-op (exact equality).
  pw <- colSums(X^2)
  out_default <- compute_marginal_bhat_shat(X, Y)
  out_override <- compute_marginal_bhat_shat(X, Y, predictor_weights = pw)
  expect_equal(out_default$Bhat, out_override$Bhat, tolerance = 0)
  expect_equal(out_default$Shat, out_override$Shat, tolerance = 0)
})

test_that("sigma2 supplied gives single-effect-residual Shat (sqrt(sigma2 / pw))", {
  X <- matrix(rnorm(N * J), N, J)
  X <- scale(X, center = TRUE, scale = FALSE)
  Y <- matrix(rnorm(N * 2), N, 2)
  out <- compute_marginal_bhat_shat(X, Y, sigma2 = 0.5)
  # With a fixed residual variance the standard error does not depend on Y:
  # Shat[j, t] = sqrt(sigma2 / pw[j]) for every outcome column t.
  pw <- colSums(X^2)
  expected_shat <- matrix(sqrt(0.5 / pw), nrow = J, ncol = 2)
  expect_equal(out$Shat, expected_shat, tolerance = 0)
})

test_that("Bhat = X'Y / colSums(X^2) for centred X", {
  X <- matrix(rnorm(N * J), N, J)
  X <- scale(X, center = TRUE, scale = FALSE)
  Y <- matrix(rnorm(N * 3), N, 3)
  out <- compute_marginal_bhat_shat(X, Y)
  # Marginal OLS slope per predictor: (x_j' y_t) / (x_j' x_j).
  expected_bhat <- crossprod(X, Y) / colSums(X^2)
  expect_equal(out$Bhat, expected_bhat, tolerance = 0)
})

test_that("Shat (no sigma2) matches per-column residual SD / sqrt(n-1)", {
  X <- matrix(rnorm(N * J), N, J)
  X <- scale(X, center = TRUE, scale = FALSE)
  Y <- matrix(rnorm(N * 2), N, 2)
  out <- compute_marginal_bhat_shat(X, Y)
  # Manual recompute, no Rfast.
  Bhat <- crossprod(X, Y) / colSums(X^2)
  expected_shat <- matrix(0, nrow = J, ncol = 2)
  for (t in 1:2) {
    for (j in 1:J) {
      # Residuals of the single-predictor fit for (predictor j, outcome t).
      r <- Y[, t] - X[, j] * Bhat[j, t]
      expected_shat[j, t] <- sqrt(var(r))
    }
  }
  expected_shat <- expected_shat / sqrt(N - 1)
  expect_equal(out$Shat, expected_shat, tolerance = 1e-12)
})


================================================
FILE: tests/testthat/test_generic_methods.R
================================================
context("Generic methods infrastructure")

# =============================================================================
# GENERIC EXISTENCE
# =============================================================================

test_that("all core generics are defined", {
  # Each exists() check asserts the generic is exported/visible as a
  # function; grouped by the IBSS pipeline phase it belongs to.
  # Data initialization
  expect_true(exists("configure_data", mode = "function"))
  expect_true(exists("get_var_y", mode = "function"))
  # Model initialization
  expect_true(exists("initialize_susie_model", mode = "function"))
  expect_true(exists("initialize_fitted", mode = "function"))
  expect_true(exists("validate_prior", mode = "function"))
  expect_true(exists("track_ibss_fit", mode = "function"))
  # Single effect regression
  expect_true(exists("compute_residuals", mode = "function"))
  expect_true(exists("compute_ser_statistics", mode = "function"))
  expect_true(exists("SER_posterior_e_loglik", mode = "function"))
  expect_true(exists("calculate_posterior_moments", mode = "function"))
  expect_true(exists("compute_kl", mode = "function"))
  expect_true(exists("get_ER2", mode = "function"))
  expect_true(exists("Eloglik", mode = "function"))
  expect_true(exists("loglik", mode = "function"))
  expect_true(exists("neg_loglik", mode = "function"))
  # Model updates
  expect_true(exists("update_fitted_values", mode = "function"))
  expect_true(exists("update_variance_components", mode = "function"))
  expect_true(exists("update_derived_quantities", mode = "function"))
  # Output generation
  expect_true(exists("get_scale_factors", mode = "function"))
  expect_true(exists("get_intercept", mode = "function"))
  expect_true(exists("get_fitted", mode = "function"))
  expect_true(exists("get_cs", mode = "function"))
  expect_true(exists("get_variable_names", mode = "function"))
  expect_true(exists("get_zscore", mode = "function"))
  expect_true(exists("cleanup_model", mode = "function"))
})

# =============================================================================
# METHOD DISPATCH
# =============================================================================

test_that("methods exist for all three data types", {
  # Every data class must provide a concrete S3 method (generic.class)
  # for each of the core generics below.
  classes <- c("individual", "ss", "rss_lambda")
  # Core generics that all data types must implement
  key_generics <- c(
    "configure_data", "get_var_y",
    "initialize_susie_model", "initialize_fitted",
    "compute_residuals", "compute_ser_statistics",
    "SER_posterior_e_loglik", "calculate_posterior_moments",
    "get_ER2", "Eloglik", "loglik", "neg_loglik",
    "update_fitted_values", "update_variance_components",
    "get_scale_factors", "get_intercept", "get_fitted",
    "get_cs", "get_variable_names", "cleanup_model"
  )
  for (generic in key_generics) {
    for (cls in classes) {
      method_name <- paste0(generic, ".", cls)
      expect_true(exists(method_name, mode = "function"),
                  info = paste("Missing method:", method_name))
    }
  }
})

test_that("default methods exist for optional generics", {
  # Optional generics fall back to a .default method rather than erroring.
  default_methods <- c(
    "configure_data.default", "validate_prior.default",
    "track_ibss_fit.default", "compute_kl.default",
    "update_variance_components.default",
    "update_derived_quantities.default",
    "get_fitted.default", "get_zscore.default",
    "cleanup_model.default"
  )
  for (method in default_methods) {
    expect_true(exists(method, mode = "function"),
                info = paste("Missing default method:", method))
  }
})

# =============================================================================
# DEFAULT METHOD BEHAVIOR
# =============================================================================

test_that("default methods have sensible fallback behavior", {
  # Minimal stand-in objects; class "test_class" has no specific methods,
  # so all calls dispatch to the .default implementations.
  data <- structure(list(n = 50, p = 10), class = "test_class")
  params <- list(track_fit = FALSE)
  model <- list(alpha = matrix(1/10, 3, 10), V = c(0.1, 0.2, 0.3), sigma2 = 1)
  # configure_data.default returns data unchanged
  expect_identical(configure_data.default(data, params), data)
  # validate_prior.default returns TRUE
  expect_true(validate_prior.default(data, params, model))
  # update_derived_quantities.default returns model unchanged
  expect_identical(update_derived_quantities.default(data, params, model), model)
  # get_fitted.default and get_zscore.default return NULL
  expect_null(get_fitted.default(data, params, model))
  expect_null(get_zscore.default(data, params, model))
})

test_that("track_ibss_fit.default stores iteration snapshots", {
  data <- structure(list(), class = "test_class")
  params <- list(track_fit = TRUE)
  model <- list(alpha = matrix(1/10, 3, 10), V = c(0.1, 0.2, 0.3), sigma2 = 1)
  tracking <- list()
  # Should store snapshot at iteration 1
  result <- track_ibss_fit.default(data, params, model, tracking, iter = 1, elbo = c(-Inf))
  expect_true(is.list(result[[1]]))
  expect_true(is.matrix(result[[1]]$alpha))
  expect_equal(result[[1]]$sigma2, 1)
  # Should store snapshot at iteration 2
  result2 <- track_ibss_fit.default(data, params, model, result, iter = 2, elbo = c(-Inf, 100))
  expect_equal(length(result2), 2)
  expect_equal(result2[[2]]$niter, 2)
  # With track_fit = FALSE, tracking stays empty
  params_no_track <- list(track_fit = FALSE)
  result3 <- track_ibss_fit.default(data, params_no_track, model, list(), iter = 1, elbo = c(-Inf))
  expect_equal(length(result3), 0)
})

test_that("cleanup_model.default removes temporary fields", {
  data <- structure(list(), class = "test_class")
  params <- list()
  model <- list(
    alpha = matrix(1/10, 3, 10),
    mu = matrix(0, 3, 10),
    sigma2 = 1,
    V = c(0.1, 0.2, 0.3),
    # Temporary fields to remove
    null_weight = 0,
    predictor_weights = rep(1/10, 10),
    residuals = rnorm(50),
    fitted_without_l = rnorm(50),
    runtime = list(prev_elbo = -100, prev_alpha = matrix(1/10, 3, 10), prev_pip_diff = 0.01)
  )
  result <- cleanup_model.default(data, params, model)
  # Keep core fields
  expect_true("alpha" %in% names(result))
  expect_true("mu" %in% names(result))
  expect_true("sigma2" %in% names(result))
  expect_true("V" %in% names(result))
  # Remove temporary fields
  expect_false("null_weight" %in% names(result))
  expect_false("predictor_weights" %in% names(result))
  expect_false("residuals" %in% names(result))
  expect_false("fitted_without_l" %in% names(result))
  expect_false("runtime" %in% names(result))
})

# =============================================================================
# DEFAULT METHOD ERROR MESSAGES
# =============================================================================
# Each test below hands a .default method an object of an unknown class and
# checks that the error message names both the generic and the class.

test_that("get_var_y.default throws error for unimplemented class", {
  data <- structure(list(y = rnorm(50)), class = "unsupported_class")
  expect_error(
    get_var_y.default(data),
    "get_var_y: no method for class 'unsupported_class'"
  )
})

test_that("initialize_susie_model.default throws error for unimplemented class", {
  data <- structure(list(n = 50, p = 10), class = "unsupported_class")
  params <- list(L = 5)
  expect_error(
    initialize_susie_model.default(data, params),
    "initialize_susie_model: no method for class 'unsupported_class'"
  )
})

test_that("initialize_fitted.default throws error for unimplemented class", {
  data <- structure(list(n = 50, p = 10), class = "unsupported_class")
  mat_init <- matrix(0, 5, 10)
  expect_error(
    initialize_fitted.default(data, mat_init),
    "initialize_fitted: no method for class 'unsupported_class'"
  )
})

test_that("compute_residuals.default throws error for unimplemented class", {
  data <- structure(list(n = 50, p = 10), class = "unsupported_class")
  params <- list()
  model <- list(alpha = matrix(1/10, 5, 10), V = rep(1, 5))
  l <- 1
  expect_error(
    compute_residuals.default(data, params, model, l),
    "compute_residuals: no method for class 'unsupported_class'"
  )
})

test_that("compute_ser_statistics.default throws error for unimplemented class", {
  data <- structure(list(n = 50, p = 10), class = "unsupported_class")
  params <- list()
  model <- list(alpha = matrix(1/10, 5, 10), residuals = rnorm(50))
  l <- 1
  expect_error(
    compute_ser_statistics.default(data, params, model, l),
    "compute_ser_statistics: no method for class 'unsupported_class'"
  )
})

test_that("SER_posterior_e_loglik.default throws error for unimplemented class", {
  data <- structure(list(n = 50, p = 10), class = "unsupported_class")
  params <- list()
  model <- list(alpha = matrix(1/10, 5, 10), lbf_variable = matrix(0, 5, 10))
  l <- 1
  expect_error(
    SER_posterior_e_loglik.default(data, params, model, l),
    "SER_posterior_e_loglik: no method for class 'unsupported_class'"
  )
})

test_that("calculate_posterior_moments.default throws error for unimplemented class", {
  data <- structure(list(n = 50, p = 10), class = "unsupported_class")
  params <- list()
  model <- list(alpha = matrix(1/10, 5, 10))
  V <- 1.0
  expect_error(
    calculate_posterior_moments.default(data, params, model, V),
    "calculate_posterior_moments: no method for class 'unsupported_class'"
  )
})

test_that("get_ER2.default throws error for unimplemented class", {
  data <- structure(list(n = 50, p = 10), class = "unsupported_class")
  model <- list(alpha = matrix(1/10, 5, 10), sigma2 = 1)
  expect_error(
    get_ER2.default(data, model),
    "get_ER2: no method for class 'unsupported_class'"
  )
})

test_that("Eloglik.default throws error for unimplemented class", {
  data <- structure(list(n = 50, p = 10), class = "unsupported_class")
  model <- list(alpha = matrix(1/10, 5, 10), sigma2 = 1)
  expect_error(
    Eloglik.default(data, model),
    "Eloglik: no method for class 'unsupported_class'"
  )
})

test_that("loglik.default throws error for unimplemented class", {
  data <- structure(list(n = 50, p = 10), class = "unsupported_class")
  params <- list()
  model <- list(alpha = matrix(1/10, 5, 10), sigma2 = 1)
  V <- 1.0
  ser_stats <- list(betahat = rnorm(10), shat2 = rep(1, 10))
  expect_error(
    loglik.default(data, params, model, V, ser_stats),
    "loglik: no method for class 'unsupported_class'"
  )
})

test_that("neg_loglik.default throws error for unimplemented class", {
  data <- structure(list(n = 50, p = 10), class = "unsupported_class")
  params <- list()
  model <- list(alpha = matrix(1/10, 5, 10), sigma2 = 1)
  V_param <- 0.0 # log scale
  ser_stats <- list(betahat = rnorm(10), shat2 = rep(1, 10))
  expect_error(
    neg_loglik.default(data, params, model, V_param, ser_stats),
    "neg_loglik: no method for class 'unsupported_class'"
  )
})

test_that("update_fitted_values.default throws error for unimplemented class", {
  data <- structure(list(n = 50, p = 10), class = "unsupported_class")
  params <- list()
  model <- list(alpha = matrix(1/10, 5, 10), mu = matrix(0, 5, 10))
  l <- 1
  expect_error(
    update_fitted_values.default(data, params, model, l),
    "update_fitted_values: no method for class 'unsupported_class'"
  )
})

test_that("get_scale_factors.default throws error for unimplemented class", {
  data <- structure(list(n = 50, p = 10), class = "unsupported_class")
  params <- list()
  expect_error(
    get_scale_factors.default(data, params),
    "get_scale_factors: no method for class 'unsupported_class'"
  )
})

test_that("get_intercept.default throws error for unimplemented class", {
  data <- structure(list(n = 50, p = 10), class = "unsupported_class")
  params <- list()
  model <- list(alpha = matrix(1/10, 5, 10), mu = matrix(0, 5, 10))
  expect_error(
    get_intercept.default(data, params, model),
    "get_intercept: no method for class 'unsupported_class'"
  )
})

test_that("get_cs.default throws error for unimplemented class", {
  data <- structure(list(n = 50, p = 10), class = "unsupported_class")
  params <- list(coverage = 0.95, min_abs_corr = 0.5)
  model <- list(alpha = matrix(1/10, 5, 10))
  expect_error(
    get_cs.default(data, params, model),
    "get_cs: no method for class 'unsupported_class'"
  )
})
test_that("get_variable_names.default throws error for unimplemented class", {
  data <- structure(list(n = 50, p = 10), class = "unsupported_class")
  model <- list(alpha = matrix(1/10, 5, 10))
  expect_error(
    get_variable_names.default(data, model),
    "get_variable_names: no method for class 'unsupported_class'"
  )
})

# =============================================================================
# Per-class verbose-row generics (format_sigma2_summary, format_extra_diag)
# =============================================================================

test_that("format_sigma2_summary.default returns sprintf %.4f of scalar sigma2", {
  model <- list(sigma2 = 1.2345678)
  expect_equal(format_sigma2_summary(model), sprintf("%.4f", 1.2345678))
  expect_type(format_sigma2_summary(model), "character")
  expect_length(format_sigma2_summary(model), 1L)
})

test_that("format_extra_diag.default returns empty string", {
  model <- list()
  expect_identical(format_extra_diag(model), "")
})

# =============================================================================
# cleanup_extra_fields generic
# =============================================================================

test_that("cleanup_extra_fields.default returns character(0)", {
  data <- list()
  expect_identical(cleanup_extra_fields(data), character(0))
})

test_that("cleanup_model.default strips standard temp fields", {
  data <- list() # default class
  model <- list(
    null_weight = 0.5,
    runtime = list(prev_elbo = -Inf),
    fitted_without_l = NA,
    keep_me = 42
  )
  out <- cleanup_model.default(data, params = list(), model = model)
  expect_null(out$null_weight)
  expect_null(out$runtime)
  expect_null(out$fitted_without_l)
  expect_equal(out$keep_me, 42)
})

# =============================================================================
# get_objective.default sum(KL) tolerates NA entries via na.rm = TRUE
# =============================================================================

test_that("get_objective.default skips NA entries in KL via na.rm = TRUE", {
  # Construct a minimal model where KL contains NA on a null effect.
  # Eloglik will throw because the model class is generic; instead we
  # intercept at the line that computes objective. Use a tiny test:
  model <- list(
    alpha = matrix(1/10, 5, 10),
    KL = c(1.0, NA_real_, 2.0, NA_real_, 0.5),
    sigma2 = 1.0
  )
  # Direct test: does sum(model$KL, na.rm = TRUE) equal 3.5?
  # NOTE(review): this only exercises base R's na.rm, not
  # get_objective.default itself — consider calling the generic directly.
  expect_equal(sum(model$KL, na.rm = TRUE), 3.5)
})


================================================
FILE: tests/testthat/test_ibss.R
================================================
context("Iterative Bayesian Stepwise Selection (IBSS)")

# =============================================================================
# IBSS_INITIALIZE - Basic Structure and Components
# =============================================================================

test_that("ibss_initialize returns correct structure with susie class", {
  setup <- setup_individual_data(n = 100, p = 50, L = 5)
  model <- ibss_initialize(setup$data, setup$params)
  expect_s3_class(model, "susie")
  expect_type(model, "list")
})

test_that("ibss_initialize creates all required model components", {
  setup <- setup_individual_data(n = 100, p = 50, L = 5)
  model <- ibss_initialize(setup$data, setup$params)
  # Core posterior components
  expect_true("alpha" %in% names(model))
  expect_true("mu" %in% names(model))
  expect_true("mu2" %in% names(model))
  expect_true("V" %in% names(model))
  expect_true("sigma2" %in% names(model))
  # Tracking components
  expect_true("lbf" %in% names(model))
  expect_true("lbf_variable" %in% names(model))
  expect_true("KL" %in% names(model))
  # Prior components
  expect_true("pi" %in% names(model))
  expect_true("predictor_weights" %in% names(model))
  # Fitted values
  expect_true("Xr" %in% names(model))
  expect_true("null_index" %in% names(model))
})

test_that("ibss_initialize creates matrices with correct dimensions", {
  n <- 100
  p <- 50
  L <- 5
  setup <- setup_individual_data(n = n, p = p, L = L)
  model <- ibss_initialize(setup$data, setup$params)
  # Posterior matrices are L x p; per-effect vectors have length L.
  expect_equal(dim(model$alpha), c(L, p))
  expect_equal(dim(model$mu), c(L, p))
  expect_equal(dim(model$mu2), c(L, p))
  expect_equal(dim(model$lbf_variable), c(L, p))
  expect_length(model$V, L)
  expect_length(model$lbf, L)
  expect_length(model$KL, L)
  expect_length(model$Xr, n)
})

# =============================================================================
# IBSS_INITIALIZE - Parameter Validation
# =============================================================================

test_that("ibss_initialize adjusts L when p < L", {
  setup <- setup_individual_data(n = 100, p = 10, L = 20)
  model <- ibss_initialize(setup$data, setup$params)
  # L should be reduced to p
  expect_equal(nrow(model$alpha), 10)
  expect_equal(length(model$V), 10)
})

test_that("ibss_initialize validates residual variance is positive", {
  setup <- setup_individual_data(n = 100, p = 50, L = 5)
  setup$params$residual_variance <- -1
  expect_error(
    ibss_initialize(setup$data, setup$params),
    "Residual variance sigma2 must be positive"
  )
})

test_that("ibss_initialize validates residual variance is scalar", {
  setup <- setup_individual_data(n = 100, p = 50, L = 5)
  setup$params$residual_variance <- c(1, 2)
  expect_error(
    ibss_initialize(setup$data, setup$params),
    "Input residual variance sigma2 must be a scalar"
  )
})

test_that("ibss_initialize validates residual variance is numeric", {
  setup <- setup_individual_data(n = 100, p = 50, L = 5)
  setup$params$residual_variance <- "one"
  expect_error(
    ibss_initialize(setup$data, setup$params),
    "Input residual variance sigma2 must be numeric"
  )
})

test_that("ibss_initialize sets default residual variance to var(y)", {
  setup <- setup_individual_data(n = 100, p = 50, L = 5)
  setup$params$residual_variance <- NULL
  var_y <- var(drop(setup$data$y))
  model <- ibss_initialize(setup$data, setup$params)
  expect_equal(model$sigma2, var_y)
})

test_that("ibss_initialize uses provided residual variance", {
  setup <- setup_individual_data(n = 100, p = 50, L = 5)
  setup$params$residual_variance <- 2.5
  model <- ibss_initialize(setup$data, setup$params)
  expect_equal(model$sigma2, 2.5)
})

# =============================================================================
# IBSS_INITIALIZE - Model Initialization (model_init)
# =============================================================================

test_that("ibss_initialize works without model_init", {
  setup <- setup_individual_data(n = 100, p = 50, L = 5)
  setup$params$model_init <- NULL
  model <- ibss_initialize(setup$data, setup$params)
  expect_equal(dim(model$alpha), c(5, 50))
  expect_true(all(model$alpha >= 0 & model$alpha <= 1))
  expect_true(all(is.finite(model$mu)))
})

test_that("ibss_initialize accepts valid susie model_init", {
  setup <- setup_individual_data(n = 100, p = 50, L = 3)
  # Create a proper previous susie fit to use as model_init
  model_init <- ibss_initialize(setup$data, setup$params)
  model_init$V <- rep(0.5, 3) # Set some prior variance
  # Use it as initialization for a new fit
  setup2 <- setup_individual_data(n = 100, p = 50, L = 3)
  setup2$params$model_init <- model_init
  model <- ibss_initialize(setup2$data, setup2$params)
  expect_equal(dim(model$alpha), c(3, 50))
  expect_true(all(model$alpha >= 0 & model$alpha <= 1))
})

test_that("ibss_initialize handles model_init with fewer effects than L", {
  setup <- setup_individual_data(n = 100, p = 50, L = 2)
  # Create init with 2 effects
  model_init <- ibss_initialize(setup$data, setup$params)
  model_init$V <- rep(0.5, 2)
  # Try to expand to 5 effects
  setup2 <- setup_individual_data(n = 100, p = 50, L = 5)
  setup2$params$model_init <- model_init
  model <- ibss_initialize(setup2$data, setup2$params)
  # Should expand to L=5 effects
  expect_equal(dim(model$alpha), c(5, 50))
})

test_that("ibss_initialize handles model_init with more effects than L", {
  setup <- setup_individual_data(n = 100, p = 50, L = 6)
  # Create init with 6 effects
  model_init <- ibss_initialize(setup$data, setup$params)
  model_init$V <- rep(0.5, 6)
  # Try to reduce to 3 effects
  setup2 <- setup_individual_data(n = 100, p = 50, L = 3)
  setup2$params$model_init <- model_init
  # When model_init has more effects, it keeps all of them (expands L)
  expect_message(
    model <- ibss_initialize(setup2$data, setup2$params),
    "using L = 6"
  )
  # Should keep all 6 effects from model_init
  expect_equal(dim(model$alpha), c(6, 50))
})

# =============================================================================
# IBSS_INITIALIZE - Mathematical Properties
# =============================================================================

test_that("ibss_initialize alpha rows sum to 1", {
  setup <- setup_individual_data(n = 100, p = 50, L = 5)
  model <- ibss_initialize(setup$data, setup$params)
  row_sums <- rowSums(model$alpha)
  expect_equal(row_sums, rep(1, 5), tolerance = 1e-10)
})

test_that("ibss_initialize alpha values are valid probabilities", {
  setup <- setup_individual_data(n = 100, p = 50, L = 5)
  model <- ibss_initialize(setup$data, setup$params)
  expect_true(all(model$alpha >= 0 & model$alpha <= 1))
})

test_that("ibss_initialize V values are non-negative", {
  setup <- setup_individual_data(n = 100, p = 50, L = 5)
  model <- ibss_initialize(setup$data, setup$params)
  expect_true(all(model$V >= 0))
  expect_true(all(is.finite(model$V)))
})

test_that("ibss_initialize sigma2 is positive", {
  setup <- setup_individual_data(n = 100, p = 50, L = 5)
  model <- ibss_initialize(setup$data, setup$params)
  expect_true(model$sigma2 > 0)
  expect_true(is.finite(model$sigma2))
})

test_that("ibss_initialize KL and lbf are initialized to NA", {
  setup <- setup_individual_data(n = 100, p = 50, L = 5)
  setup$params$model_init <- NULL
  model <- ibss_initialize(setup$data, setup$params)
  expect_true(all(is.na(model$KL)))
  expect_true(all(is.na(model$lbf)))
})

# =============================================================================
# IBSS_INITIALIZE - Fitted Values
# =============================================================================
# Each data type stores its fitted values under a different field name:
# individual -> Xr (length n), ss -> XtXr (length p), rss_lambda -> Rz.

test_that("ibss_initialize creates fitted values for individual data", {
  setup <- setup_individual_data(n = 100, p = 50, L = 5)
  model <- ibss_initialize(setup$data, setup$params)
  expect_true("Xr" %in% names(model))
  expect_length(model$Xr, 100)
  expect_true(all(is.finite(model$Xr)))
})

test_that("ibss_initialize creates fitted values for sufficient stats", {
  setup <- setup_ss_data(n = 100, p = 50, L = 5)
  model <- ibss_initialize(setup$data, setup$params)
  expect_true("XtXr" %in% names(model))
  expect_length(model$XtXr, 50)
  expect_true(all(is.finite(model$XtXr)))
})

test_that("ibss_initialize creates fitted values for rss_lambda", {
  setup <- setup_rss_lambda_data(n = 500, p = 50, L = 5, lambda = 0.5)
  model <- ibss_initialize(setup$data, setup$params)
  expect_true("Rz" %in% names(model))
  expect_length(model$Rz, 50)
  expect_true(all(is.finite(model$Rz)))
})

# =============================================================================
# IBSS_INITIALIZE - Null Index
# =============================================================================

test_that("ibss_initialize sets null_index to 0 when null_weight = 0", {
  setup <- setup_individual_data(n = 100, p = 50, L = 5)
  # FIX: previously assigned to setup$model$null_weight, a field that does
  # not exist and is never read by ibss_initialize(setup$data, setup$params),
  # so the test only passed because 0 is the default. Set the parameter the
  # same way the companion test below does.
  setup$params$null_weight <- 0
  model <- ibss_initialize(setup$data, setup$params)
  expect_equal(model$null_index, 0)
})

test_that("ibss_initialize sets null_index when null_weight > 0", {
  setup <- setup_individual_data(n = 100, p = 50, L = 5)
  setup$params$null_weight <- 0.5
  model <- ibss_initialize(setup$data, setup$params)
  expect_true(model$null_index > 0)
})

# =============================================================================
# IBSS_INITIALIZE - Data Type Compatibility
# =============================================================================

test_that("ibss_initialize works with individual data", {
  setup <- setup_individual_data(n = 100, p = 50, L = 5)
  model <- ibss_initialize(setup$data, setup$params)
  expect_s3_class(model, "susie")
  expect_true("Xr" %in% names(model))
})

test_that("ibss_initialize works with sufficient stats", {
  setup <- setup_ss_data(n = 100, p = 50, L = 5)
  model <- ibss_initialize(setup$data, setup$params)
  expect_s3_class(model, "susie")
  expect_true("XtXr" %in% names(model))
})

test_that("ibss_initialize works with rss_lambda", {
  setup <- setup_rss_lambda_data(n = 500, p = 50, L = 5, lambda = 0.5)
  model <- ibss_initialize(setup$data, setup$params)
  expect_s3_class(model, "susie")
  expect_true("Rz" %in% names(model))
})

# =============================================================================
# IBSS_FIT - Basic Functionality
# =============================================================================

test_that("ibss_fit updates all L effects", {
  setup <- setup_individual_data(n = 100, p = 50, L = 5)
  model <- ibss_initialize(setup$data, setup$params)
  # Fit one iteration
  model_updated <- ibss_fit(setup$data, setup$params, model)
  # All effects should still have valid probabilities
  for (l in 1:5) {
    expect_equal(sum(model_updated$alpha[l, ]), 1, tolerance = 1e-10)
  }
  # V should be updated (even if to 0 for no signal)
  expect_true(all(is.finite(model_updated$V)))
  expect_true(all(model_updated$V >= 0))
})

test_that("ibss_fit updates V for all effects", {
  setup <- setup_individual_data(n = 100, p = 50, L = 5)
  model <- ibss_initialize(setup$data, setup$params)
  # Store initial V
  V_init <- model$V
  # Fit one iteration
  model_updated <- ibss_fit(setup$data, setup$params, model)
  # V should be updated (unless it converged to same values)
  expect_length(model_updated$V, 5)
  expect_true(all(model_updated$V >= 0))
  expect_true(all(is.finite(model_updated$V)))
})

test_that("ibss_fit updates lbf for all effects", {
  setup <- setup_individual_data(n = 100, p = 50, L = 5)
  model <- ibss_initialize(setup$data, setup$params)
  # Fit one iteration
  model_updated <- ibss_fit(setup$data, setup$params, model)
  expect_length(model_updated$lbf, 5)
  expect_true(all(is.finite(model_updated$lbf)))
})

test_that("ibss_fit updates KL for all effects", {
  setup <- setup_individual_data(n = 100, p = 50, L = 5)
  model <- ibss_initialize(setup$data, setup$params)
  # Fit one iteration
  model_updated <- ibss_fit(setup$data, setup$params, model)
  expect_length(model_updated$KL, 5)
  expect_true(all(is.finite(model_updated$KL)))
  # KL divergence should be non-negative
  expect_true(all(model_updated$KL >= -1e-6))
})

# =============================================================================
# IBSS_FIT - Mathematical Properties
# =============================================================================

test_that("ibss_fit maintains valid probability distributions", {
  setup <- setup_individual_data(n = 100, p = 50, L = 5)
  model <- ibss_initialize(setup$data, setup$params)
  model_updated <- ibss_fit(setup$data, setup$params, model)
  # Each row of alpha should sum to 1
  row_sums <- rowSums(model_updated$alpha)
  expect_equal(row_sums, rep(1, 5), tolerance = 1e-10)
  # All alpha values should be valid probabilities
  expect_true(all(model_updated$alpha >= 0))
  expect_true(all(model_updated$alpha <= 1))
})

test_that("ibss_fit maintains finite values", {
  setup <- setup_individual_data(n = 100, p = 50, L = 5)
  model <- ibss_initialize(setup$data, setup$params)
  model_updated <- ibss_fit(setup$data, setup$params, model)
  expect_true(all(model_updated$alpha >= 0 & model_updated$alpha <= 1))
  expect_true(all(is.finite(model_updated$mu)))
  expect_true(all(is.finite(model_updated$mu2)))
  expect_true(all(is.finite(model_updated$V)))
})

test_that("ibss_fit updates fitted values", {
  setup <- setup_individual_data(n = 100, p = 50, L = 5)
  model <- ibss_initialize(setup$data, setup$params)
  Xr_init <- model$Xr
  model_updated <- ibss_fit(setup$data, setup$params, model)
  # Fitted values should be updated
  expect_true("Xr" %in% names(model_updated))
  expect_length(model_updated$Xr, 100)
})

# =============================================================================
# IBSS_FIT - Edge Cases
# =============================================================================

test_that("ibss_fit works with L=1", {
  setup <- setup_individual_data(n = 100, p = 50, L = 1)
  model <- ibss_initialize(setup$data, setup$params)
  model_updated <- ibss_fit(setup$data, setup$params, model)
  expect_equal(dim(model_updated$alpha), c(1, 50))
  expect_equal(sum(model_updated$alpha), 1, tolerance = 1e-10)
})

test_that("ibss_fit works with L=0 (no effects)", {
  setup <- setup_individual_data(n = 100, p = 50, L = 0)
  model <- list(alpha = matrix(0, 0, 50))
  # Should handle gracefully
  model_updated <- ibss_fit(setup$data, setup$params, model)
  expect_equal(nrow(model_updated$alpha), 0)
})

test_that("ibss_fit works with different data types", {
  # Individual data
  setup_ind <- setup_individual_data(n = 100, p = 50, L = 5)
  model_ind <- ibss_initialize(setup_ind$data, setup_ind$params)
  model_ind_updated <- ibss_fit(setup_ind$data, setup_ind$params, model_ind)
  expect_s3_class(model_ind_updated, "susie")
  # Sufficient stats
  setup_ss <- setup_ss_data(n = 100, p = 50, L = 5)
  model_ss <- ibss_initialize(setup_ss$data, setup_ss$params)
  model_ss_updated <- ibss_fit(setup_ss$data, setup_ss$params, model_ss)
  expect_s3_class(model_ss_updated, "susie")
  # RSS lambda
  setup_rss <- setup_rss_lambda_data(n = 500, p = 50, L = 5, lambda = 0.5)
  model_rss <- ibss_initialize(setup_rss$data, setup_rss$params)
  model_rss_updated <- ibss_fit(setup_rss$data, setup_rss$params, model_rss)
  expect_s3_class(model_rss_updated, "susie")
})

# =============================================================================
# IBSS_FIT - Iterative Behavior
# =============================================================================

test_that("ibss_fit can be called iteratively", {
  setup <- setup_individual_data(n = 100, p = 50, L = 5)
  model <- ibss_initialize(setup$data, setup$params)
  # Run multiple iterations
  for (iter in 1:3) {
    model <- ibss_fit(setup$data, setup$params, model)
    # Check validity after each iteration
    expect_equal(rowSums(model$alpha), rep(1, 5), tolerance = 1e-10)
    expect_true(all(model$V >= 0))
  }
})

# =============================================================================
# IBSS_FINALIZE - Basic Functionality
# =============================================================================

test_that("ibss_finalize adds required output fields", {
  setup <- setup_individual_data(n = 100, p = 50, L = 5)
  model <- ibss_initialize(setup$data, setup$params)
  model <- ibss_fit(setup$data, setup$params, model)
  model_final <- ibss_finalize(setup$data, setup$params, model,
                               elbo = NULL, iter = 10L, tracking = NULL)
  # Check for required output fields
  expect_true("niter" %in% names(model_final))
  expect_true("intercept" %in% names(model_final))
  expect_true("fitted" %in% names(model_final))
  expect_true("sets" %in% names(model_final))
  expect_true("pip" %in% names(model_final))
  expect_true("X_column_scale_factors" %in% names(model_final))
})

test_that("ibss_finalize sets iteration count", {
  setup <- setup_individual_data(n = 100, p = 50, L = 5)
  model <- ibss_initialize(setup$data, setup$params)
  model <- ibss_fit(setup$data, setup$params, model)
  model_final <- ibss_finalize(setup$data, setup$params, model,
                               elbo = NULL, iter = 42L, tracking = NULL)
  expect_equal(model_final$niter, 42L)
})

test_that("ibss_finalize computes PIPs", {
  setup <- setup_individual_data(n = 100, p = 50, L = 5)
  model <- ibss_initialize(setup$data, setup$params)
  model <- ibss_fit(setup$data, setup$params, model)
  model_final <- ibss_finalize(setup$data, setup$params, model,
                               elbo = NULL, iter = 10L, tracking = NULL)
  expect_length(model_final$pip, 50)
  expect_true(all(model_final$pip >= 0))
  expect_true(all(model_final$pip <= 1))
  expect_true(all(is.finite(model_final$pip)))
})

test_that("ibss_finalize computes credible sets", {
  setup <- setup_individual_data(n = 100, p = 50, L = 5)
  model <- ibss_initialize(setup$data, setup$params)
  model <- ibss_fit(setup$data, setup$params, model)
  model_final <- ibss_finalize(setup$data, setup$params, model,
                               elbo = NULL, iter = 10L, tracking = NULL)
  expect_true("sets" %in% names(model_final))
  expect_type(model_final$sets, "list")
})

test_that("ibss_finalize computes fitted values", {
  setup <- setup_individual_data(n = 100, p = 50, L = 5)
  model <- ibss_initialize(setup$data, setup$params)
  model <- ibss_fit(setup$data, setup$params, model)
  model_final <- ibss_finalize(setup$data, setup$params, model,
                               elbo = NULL, iter = 10L, tracking = NULL)
  expect_true("fitted" %in% names(model_final))
  expect_length(model_final$fitted, 100)
  expect_true(all(is.finite(model_final$fitted)))
})

test_that("ibss_finalize computes intercept", {
  setup <- setup_individual_data(n = 100, p = 50, L = 5)
  setup$params$intercept <- TRUE
  model <- ibss_initialize(setup$data, setup$params)
  model <- ibss_fit(setup$data, setup$params, model)
  model_final <- ibss_finalize(setup$data, setup$params, model,
                               elbo = NULL, iter = 10L, tracking = NULL)
  expect_true("intercept" %in% names(model_final))
  expect_true(is.finite(model_final$intercept))
})

# =============================================================================
# IBSS_FINALIZE - Tracking
# =============================================================================

test_that("ibss_finalize includes tracking when track_fit=TRUE", {
  setup <- setup_individual_data(n = 100, p = 50, L = 5)
  setup$params$track_fit <- TRUE
  model <- ibss_initialize(setup$data, setup$params)
  model <- ibss_fit(setup$data, setup$params, model)
  # Create mock tracking data
  tracking <- list(
    elbo = c(100, 110, 115),
    sigma2 = c(1, 0.9, 0.85)
  )
  model_final <- ibss_finalize(setup$data, setup$params, model,
                               elbo = NULL, iter = 3L, tracking = tracking)
  expect_true("trace" %in% names(model_final))
  expect_type(model_final$trace, "list")
})

test_that("ibss_finalize excludes tracking when track_fit=FALSE", {
  setup <- setup_individual_data(n = 100, p = 50, L = 5)
  setup$params$track_fit <- FALSE
  model <- ibss_initialize(setup$data, setup$params)
  model <- ibss_fit(setup$data, setup$params, model)
  model_final <- ibss_finalize(setup$data, setup$params, model,
                               elbo = NULL, iter = 3L, tracking = NULL)
  expect_false("trace" %in% names(model_final))
})

# =============================================================================
# IBSS_FINALIZE - Variable Names
# =============================================================================

test_that("ibss_finalize assigns variable names when available", {
  setup <- setup_individual_data(n = 100, p = 50, L = 5)
  # Add column names to X
  colnames(setup$data$X) <- paste0("var", 1:50)
  model <- ibss_initialize(setup$data, setup$params)
  model <- ibss_fit(setup$data, setup$params, model)
  model_final <- ibss_finalize(setup$data, setup$params, model,
                               elbo = NULL, iter = 10L, tracking = NULL)
  # Check that variable names are assigned to pip
  expect_named(model_final$pip, paste0("var", 1:50))
})

# =============================================================================
# IBSS_FINALIZE - Z-scores
# =============================================================================

test_that("ibss_finalize computes z-scores for individual data", {
  setup <- setup_individual_data(n = 100, p = 50, L = 5)
  model <- ibss_initialize(setup$data, setup$params)
  model <- ibss_fit(setup$data, setup$params, model)
  model_final <- ibss_finalize(setup$data, setup$params, model,
                               elbo = NULL, iter = 10L, tracking = NULL)
  expect_true("z" %in% names(model_final))
  if (!is.null(model_final$z)) {
    expect_length(model_final$z, 50)
    expect_true(all(is.finite(model_final$z)))
  }
})

# =============================================================================
# IBSS_FINALIZE - Scale Factors
# =============================================================================

test_that("ibss_finalize computes X_column_scale_factors", {
  setup <- setup_individual_data(n = 100, p = 50, L = 5)
  model <- ibss_initialize(setup$data, setup$params)
  model <- ibss_fit(setup$data, setup$params, model)
  model_final <- ibss_finalize(setup$data, setup$params, model,
                               elbo = NULL, iter = 10L, tracking = NULL)
  expect_true("X_column_scale_factors" %in% names(model_final))
  expect_length(model_final$X_column_scale_factors, 50)
})

# =============================================================================
# IBSS_FINALIZE - Data Type Compatibility
# =============================================================================

test_that("ibss_finalize works with individual data", {
  setup <- setup_individual_data(n = 100, p = 50, L = 5)
  model <- ibss_initialize(setup$data, setup$params)
  model <- ibss_fit(setup$data, setup$params, model)
  model_final <- ibss_finalize(setup$data, setup$params, model,
                               elbo = NULL, iter = 10L, tracking = NULL)
  expect_s3_class(model_final, "susie")
  expect_true("fitted" %in% names(model_final))
  expect_length(model_final$fitted, 100)
})

# =============================================================================
# FULL IBSS PIPELINE
# =============================================================================

test_that("Full IBSS pipeline produces valid susie object", {
  setup <- setup_individual_data(n = 100, p = 50, L = 5)
  # Initialize
  model <- ibss_initialize(setup$data, setup$params)
  # Fit (run 5 iterations)
  for (i in 1:5) {
    model <- ibss_fit(setup$data, setup$params, model)
  }
  # Finalize
  model <- ibss_finalize(setup$data, setup$params, model,
                         elbo = NULL, iter = 5L, tracking = NULL)
  # Check final model is complete
  expect_s3_class(model, "susie")
  expect_true("alpha" %in% names(model))
  expect_true("mu" %in% names(model))
  expect_true("V" %in% names(model))
  expect_true("pip" %in% names(model))
  expect_true("sets" %in% names(model))
  expect_true("fitted" %in% names(model))
  expect_true("niter" %in% names(model))
  expect_equal(model$niter, 5L)
})

test_that("Full IBSS pipeline maintains mathematical properties", {
  setup <- setup_individual_data(n = 100, p = 50, L = 5)
  # Initialize
  model <- ibss_initialize(setup$data, setup$params)
  # Fit (run 3 iterations)
  for (i in 1:3) {
    model <- ibss_fit(setup$data, setup$params, model)
  }
  # Finalize
  model <-
ibss_finalize(setup$data, setup$params, model, elbo = NULL, iter = 3L, tracking = NULL) # Check mathematical properties expect_equal(rowSums(model$alpha), rep(1, 5), tolerance = 1e-10) expect_true(all(model$pip >= 0)) expect_true(all(model$pip <= 1)) expect_true(all(model$V >= 0)) }) ================================================ FILE: tests/testthat/test_individual_data_methods.R ================================================ context("S3 methods for individual data class") # ============================================================================= # DATA INITIALIZATION & CONFIGURATION # ============================================================================= test_that("configure_data.individual returns data when unmappable_effects='none'", { setup <- setup_individual_data() setup$params$unmappable_effects <- "none" result <- configure_data.individual(setup$data, setup$params) expect_true("individual" %in% class(result)) }) test_that("get_var_y.individual computes variance of y", { setup <- setup_individual_data() var_y <- get_var_y.individual(setup$data) expect_type(var_y, "double") expect_length(var_y, 1) expect_true(var_y > 0) expect_equal(var_y, var(setup$data$y)) }) # ============================================================================= # MODEL INITIALIZATION & SETUP # ============================================================================= test_that("initialize_susie_model.individual creates model with predictor_weights", { setup <- setup_individual_data() var_y <- var(setup$data$y) model <- initialize_susie_model.individual(setup$data, setup$params, var_y) expect_true("predictor_weights" %in% names(model)) expect_length(model$predictor_weights, setup$data$p) expect_equal(model$predictor_weights, attr(setup$data$X, "d")) }) test_that("initialize_fitted.individual creates Xr", { setup <- setup_individual_data() mat_init <- list( alpha = setup$model$alpha, mu = setup$model$mu ) fitted <- initialize_fitted.individual(setup$data, 
mat_init) expect_true("Xr" %in% names(fitted)) expect_length(fitted$Xr, setup$data$n) }) test_that("validate_prior.individual delegates to default method", { setup <- setup_individual_data() result <- validate_prior.individual(setup$data, setup$params, setup$model) expect_type(result, "logical") }) test_that("track_ibss_fit.individual delegates to default method", { setup <- setup_individual_data() tracking <- list() iter <- 1 elbo <- -100 result <- track_ibss_fit.individual(setup$data, setup$params, setup$model, tracking, iter, elbo) expect_type(result, "list") }) # ============================================================================= # SINGLE EFFECT REGRESSION & ELBO # ============================================================================= test_that("compute_residuals.individual computes residuals correctly", { setup <- setup_individual_data() l <- 1 model <- compute_residuals.individual(setup$data, setup$params, setup$model, l) expect_true("residuals" %in% names(model)) expect_true("fitted_without_l" %in% names(model)) expect_true("raw_residuals" %in% names(model)) expect_true("residual_variance" %in% names(model)) expect_length(model$residuals, setup$data$p) expect_length(model$raw_residuals, setup$data$n) }) test_that("compute_ser_statistics.individual computes betahat and shat2", { setup <- setup_individual_data() l <- 1 model <- compute_residuals.individual(setup$data, setup$params, setup$model, l) ser_stats <- compute_ser_statistics.individual(setup$data, setup$params, model, l) expect_true("betahat" %in% names(ser_stats)) expect_true("shat2" %in% names(ser_stats)) expect_true("optim_init" %in% names(ser_stats)) expect_true("optim_bounds" %in% names(ser_stats)) expect_true("optim_scale" %in% names(ser_stats)) expect_length(ser_stats$betahat, setup$data$p) expect_length(ser_stats$shat2, setup$data$p) expect_true(all(ser_stats$shat2 > 0)) }) test_that("calculate_posterior_moments.individual computes posterior correctly", { setup <- 
setup_individual_data() l <- 1 V <- 1.0 model <- compute_residuals.individual(setup$data, setup$params, setup$model, l) model <- calculate_posterior_moments.individual(setup$data, setup$params, model, V, l) expect_length(model$mu[l, ], setup$data$p) expect_length(model$mu2[l, ], setup$data$p) post_var <- model$mu2[l, ] - model$mu[l, ]^2 expect_true(all(post_var >= -1e-10)) expect_true(all(model$mu2[l, ] >= model$mu[l, ]^2 - 1e-10)) }) test_that("calculate_posterior_moments.individual handles V=0", { setup <- setup_individual_data() l <- 1 V <- 0 setup$params$use_NIG <- TRUE model <- compute_residuals.individual(setup$data, setup$params, setup$model, l) model <- calculate_posterior_moments.individual(setup$data, setup$params, model, V, l) expect_equal(model$mu[l, ], rep(0, setup$data$p)) expect_equal(model$mu2[l, ], rep(0, setup$data$p)) }) test_that("compute_kl.individual computes KL divergence", { setup <- setup_individual_data() l <- 1 setup$model$lbf <- rep(0, setup$params$L) setup$model$alpha[l, ] <- rep(1/setup$data$p, setup$data$p) setup$model$mu[l, ] <- rnorm(setup$data$p, sd = 0.1) setup$model$mu2[l, ] <- setup$model$mu[l, ]^2 + 0.1 model <- compute_residuals.individual(setup$data, setup$params, setup$model, l) model <- compute_kl.individual(setup$data, setup$params, model, l) expect_type(model$KL[l], "double") expect_length(model$KL[l], 1) }) test_that("get_ER2.individual computes expected squared residuals", { setup <- setup_individual_data() er2 <- get_ER2.individual(setup$data, setup$model) expect_type(er2, "double") expect_length(er2, 1) expect_true(er2 >= 0) }) test_that("Eloglik.individual computes expected log-likelihood", { setup <- setup_individual_data() e_loglik <- Eloglik.individual(setup$data, setup$model) expect_type(e_loglik, "double") expect_length(e_loglik, 1) }) test_that("loglik.individual computes log Bayes factors", { setup <- setup_individual_data() l <- 1 V <- 1.0 model <- compute_residuals.individual(setup$data, setup$params, 
setup$model, l) ser_stats <- compute_ser_statistics.individual(setup$data, setup$params, model, l) model <- loglik.individual(setup$data, setup$params, model, V, ser_stats, l) expect_length(model$lbf_variable[l, ], setup$data$p) expect_length(model$alpha[l, ], setup$data$p) expect_true(all(model$alpha[l, ] >= 0)) expect_true(abs(sum(model$alpha[l, ]) - 1) < 1e-10) expect_true(is.numeric(model$lbf[l])) }) test_that("neg_loglik.individual returns negative log-likelihood", { setup <- setup_individual_data() l <- 1 V_param <- log(1.0) model <- compute_residuals.individual(setup$data, setup$params, setup$model, l) ser_stats <- compute_ser_statistics.individual(setup$data, setup$params, model, l) neg_ll <- neg_loglik.individual(setup$data, setup$params, model, V_param, ser_stats) expect_type(neg_ll, "double") expect_length(neg_ll, 1) }) test_that("SER_posterior_e_loglik.individual computes expected log-likelihood", { setup <- setup_individual_data() l <- 1 setup$model$alpha[l, ] <- rep(1/setup$data$p, setup$data$p) setup$model$mu[l, ] <- rnorm(setup$data$p) setup$model$mu2[l, ] <- setup$model$mu[l, ]^2 + 0.1 model <- compute_residuals.individual(setup$data, setup$params, setup$model, l) e_loglik <- SER_posterior_e_loglik.individual(setup$data, setup$params, model, l) expect_type(e_loglik, "double") expect_length(e_loglik, 1) }) # ============================================================================= # MODEL UPDATES & FITTING # ============================================================================= test_that("update_fitted_values.individual updates Xr", { setup <- setup_individual_data() l <- 1 model <- compute_residuals.individual(setup$data, setup$params, setup$model, l) setup$model$fitted_without_l <- model$fitted_without_l updated_model <- update_fitted_values.individual(setup$data, setup$params, setup$model, l) expect_true("Xr" %in% names(updated_model)) expect_length(updated_model$Xr, setup$data$n) }) test_that("update_variance_components.individual 
delegates to default method", { setup <- setup_individual_data() result <- update_variance_components.individual(setup$data, setup$params, setup$model) expect_type(result, "list") }) test_that("update_derived_quantities.individual delegates to default method", { setup <- setup_individual_data() result <- update_derived_quantities.individual(setup$data, setup$params, setup$model) expect_type(result, "list") }) # ============================================================================= # OUTPUT GENERATION & POST-PROCESSING # ============================================================================= test_that("get_scale_factors.individual returns column scale factors", { setup <- setup_individual_data() scales <- get_scale_factors.individual(setup$data, setup$params) expect_length(scales, setup$data$p) expect_true(all(scales > 0)) expect_equal(scales, attr(setup$data$X, "scaled:scale")) }) test_that("get_intercept.individual computes intercept when intercept=TRUE", { setup <- setup_individual_data() setup$params$intercept <- TRUE intercept <- get_intercept.individual(setup$data, setup$params, setup$model) expect_type(intercept, "double") expect_length(intercept, 1) }) test_that("get_intercept.individual returns 0 when intercept=FALSE", { setup <- setup_individual_data() setup$params$intercept <- FALSE intercept <- get_intercept.individual(setup$data, setup$params, setup$model) expect_equal(intercept, 0) }) test_that("get_fitted.individual returns fitted values with correct length", { setup <- setup_individual_data() fitted <- get_fitted.individual(setup$data, setup$params, setup$model) expect_length(fitted, setup$data$n) expect_type(fitted, "double") }) test_that("get_fitted.individual adds intercept when intercept=TRUE", { setup <- setup_individual_data() setup$params$intercept <- TRUE setup$data$mean_y <- 5.0 fitted <- get_fitted.individual(setup$data, setup$params, setup$model) expect_true(any(fitted != setup$model$Xr)) }) test_that("get_fitted.individual 
does not add intercept when intercept=FALSE", { setup <- setup_individual_data() setup$params$intercept <- FALSE setup$data$mean_y <- 0 fitted <- get_fitted.individual(setup$data, setup$params, setup$model) expect_equal(fitted, drop(setup$model$Xr)) }) test_that("get_cs.individual returns NULL when coverage is NULL", { setup <- setup_individual_data() setup$params$coverage <- NULL cs <- get_cs.individual(setup$data, setup$params, setup$model) expect_null(cs) }) test_that("get_cs.individual returns NULL when min_abs_corr is NULL", { setup <- setup_individual_data() setup$params$min_abs_corr <- NULL cs <- get_cs.individual(setup$data, setup$params, setup$model) expect_null(cs) }) test_that("get_variable_names.individual assigns variable names to model", { setup <- setup_individual_data() colnames(setup$data$X) <- paste0("var", 1:setup$data$p) setup$model$pip <- rep(0.1, setup$data$p) setup$model$null_weight <- NULL setup$model$alpha <- matrix(0, 5, setup$data$p) setup$model$mu <- matrix(0, 5, setup$data$p) setup$model$mu2 <- matrix(0, 5, setup$data$p) setup$model$lbf_variable <- matrix(0, 5, setup$data$p) model_with_names <- get_variable_names.individual(setup$data, setup$model) expect_true(all(grepl("var", colnames(model_with_names$alpha)))) expect_true(all(grepl("var", colnames(model_with_names$mu)))) expect_true(all(grepl("var", colnames(model_with_names$mu2)))) expect_true(all(grepl("var", names(model_with_names$pip)))) }) test_that("get_zscore.individual computes z-scores", { setup <- setup_individual_data() setup$params$compute_univariate_zscore <- TRUE z <- get_zscore.individual(setup$data, setup$params, setup$model) expect_length(z, setup$data$p) expect_type(z, "double") }) test_that("get_zscore.individual handles null_weight", { setup <- setup_individual_data() setup$params$compute_univariate_zscore <- TRUE setup$model$null_weight <- 0.1 setup$data$X <- cbind(setup$data$X, 0) z <- get_zscore.individual(setup$data, setup$params, setup$model) expect_length(z, 
setup$data$p) }) test_that("get_zscore.individual returns default when compute_univariate_zscore=FALSE", { setup <- setup_individual_data() setup$params$compute_univariate_zscore <- FALSE z <- get_zscore.individual(setup$data, setup$params, setup$model) expect_null(z) }) test_that("get_zscore.individual warns when X is not a matrix (sparse/trend filtering)", { setup <- setup_individual_data() setup$params$compute_univariate_zscore <- TRUE # Convert X to sparse matrix setup$data$X <- Matrix::Matrix(setup$data$X, sparse = TRUE) # Should produce warning about slow computation expect_message( z <- get_zscore.individual(setup$data, setup$params, setup$model), "Calculation of univariate regression z-scores is not implemented specifically for sparse or trend filtering matrices" ) # Should still compute z-scores expect_length(z, setup$data$p) expect_type(z, "double") }) test_that("cleanup_model.individual removes temporary fields", { setup <- setup_individual_data() setup$model$raw_residuals <- rnorm(setup$data$n) setup$model$residuals <- rnorm(setup$data$p) cleaned <- cleanup_model.individual(setup$data, setup$params, setup$model) expect_false("raw_residuals" %in% names(cleaned)) }) ================================================ FILE: tests/testthat/test_l_greedy.R ================================================ # Greedy-L outer loop in susie_workhorse. # Contracts: (1) L_greedy = NULL is bit-identical to fixed-L susie. # (2) L_greedy != NULL grows L until min(lbf) < lbf_min or L reaches # params$L. 
# Shared fixture: N = 200 samples, J = 100 predictors, two true effects.
# All tests below reuse X/y (and the RNG state set here), so statement
# order matters.
set.seed(42)
N <- 200
J <- 100
X <- matrix(rnorm(N * J), N, J)
true_idx <- c(10, 30) # K = 2 real effects
beta <- numeric(J)
beta[true_idx] <- c(2.5, -1.8)
y <- X %*% beta + rnorm(N, sd = 0.3)

test_that("L_greedy = NULL is bit-identical to fixed-L susie", {
  fit_fixed <- susie(X, y, L = 5)
  # init_only = TRUE returns the prepared (data, params) pair without
  # fitting, so susie_workhorse can be called directly with L_greedy off.
  obj <- susie(X, y, L = 5, init_only = TRUE)
  obj$params$L_greedy <- NULL
  fit_direct <- susie_workhorse(obj$data, obj$params)
  # tolerance = 0 demands bit-identical results, not numerical closeness.
  expect_equal(fit_direct$alpha, fit_fixed$alpha, tolerance = 0)
  expect_equal(fit_direct$lbf, fit_fixed$lbf, tolerance = 0)
  expect_equal(fit_direct$elbo, fit_fixed$elbo, tolerance = 0)
})

test_that("L_greedy grows L in steps of L_greedy, capped at params$L", {
  obj <- susie(X, y, L = 10, init_only = TRUE)
  obj$params$L_greedy <- 3
  obj$params$lbf_min <- 0.1
  fit <- susie_workhorse(obj$data, obj$params)
  final_L <- nrow(fit$alpha)
  # NOTE(review): the membership check admits 10, but the expect_lte below
  # caps final_L at 9, so the effective allowed set is c(3, 6, 9).
  expect_true(final_L %in% c(3, 6, 9, 10)) # multiple of 3, capped at 10
  expect_lte(final_L, 9) # K = 2 real, saturates early
})

test_that("L_greedy >= K_true saturates in a single round", {
  # L_greedy = 6, K = 2 real. Round 1 at L = 6 has empty slots so
  # min(lbf) < lbf_min fires immediately, no wasted second round.
  obj <- susie(X, y, L = 12, init_only = TRUE)
  obj$params$L_greedy <- 6
  obj$params$lbf_min <- 0.1
  fit <- susie_workhorse(obj$data, obj$params)
  expect_identical(nrow(fit$alpha), 6L)
})

test_that("K_true > L_greedy keeps growing past the first round", {
  # Fresh data with four true effects, so one round of 3 cannot suffice.
  set.seed(7)
  Xh <- matrix(rnorm(N * J), N, J)
  bh <- numeric(J)
  bh[c(5, 20, 45, 70)] <- c(2.5, -2.0, 1.8, -1.5) # K = 4 real effects
  yh <- Xh %*% bh + rnorm(N, sd = 0.3)
  obj <- susie(Xh, yh, L = 10, init_only = TRUE)
  obj$params$L_greedy <- 3
  obj$params$lbf_min <- 0.1
  fit <- susie_workhorse(obj$data, obj$params)
  # At least two growth rounds (>= 6), never past the cap (<= 10).
  expect_gte(nrow(fit$alpha), 6)
  expect_lte(nrow(fit$alpha), 10)
})

test_that("L_greedy = L stops after one round at L", {
  obj <- susie(X, y, L = 3, init_only = TRUE)
  obj$params$L_greedy <- 3
  fit <- susie_workhorse(obj$data, obj$params)
  expect_identical(nrow(fit$alpha), 3L)
})

test_that("L_greedy is exposed through susie interfaces", {
  # Individual-data interface.
  fit <- susie(X, y, L = 8, L_greedy = 3, greedy_lbf_cutoff = 0.1,
               verbose = FALSE)
  expect_lte(nrow(fit$alpha), 8)
  expect_gte(nrow(fit$alpha), 3)

  # Sufficient-statistics interface.
  y_vec <- drop(y)
  ss <- compute_suff_stat(X, y_vec, standardize = TRUE)
  fit_ss <- susie_ss(ss$XtX, ss$Xty, ss$yty, n = ss$n, L = 8, L_greedy = 3,
                     greedy_lbf_cutoff = 0.1, verbose = FALSE)
  expect_lte(nrow(fit_ss$alpha), 8)
  expect_gte(nrow(fit_ss$alpha), 3)

  # Summary-statistics (RSS) interface.
  z <- as.vector(crossprod(scale(X), drop(scale(y_vec))) / sqrt(nrow(X) - 1))
  R <- cor(X)
  fit_rss <- susie_rss(z = z, R = R, n = nrow(X), L = 8, L_greedy = 3,
                       greedy_lbf_cutoff = 0.1, verbose = FALSE)
  expect_lte(nrow(fit_rss$alpha), 8)
  expect_gte(nrow(fit_rss$alpha), 3)
})

================================================
FILE: tests/testthat/test_mixture_prior.R
================================================
# Tests for estimate_prior_method = "fixed_mixture"
#
# Key invariant: a K=1 mixture with grid = c(V) and weights = c(1)
# must produce identical results to the scalar V path with
# estimate_prior_variance = FALSE and prior_variance = V.
context("Fixed mixture prior")

# Generate a small test dataset
set.seed(1)
n <- 200
p <- 50
X <- matrix(rnorm(n * p), n, p)
beta <- rep(0, p)
beta[c(1, 5, 10)] <- c(0.5, -0.3, 0.4)
y <- X %*% beta + rnorm(n)

# Compute summary stats
R <- cor(X)
z <- as.vector(sqrt(n) * crossprod(X, y) / sqrt(n * diag(crossprod(X))))

# =============================================================================
# Test 1: K=1 mixture matches scalar V exactly (individual data)
# =============================================================================
test_that("K=1 mixture matches scalar V for individual data", {
  L <- 5
  # Run scalar path first to find effective V
  fit_scalar <- susie(X, y, L = L,
                      estimate_prior_variance = FALSE,
                      estimate_residual_variance = FALSE,
                      max_iter = 20, tol = 1e-4)
  V_eff <- fit_scalar$V[1]
  # K=1 mixture path with the same effective V
  fit_mixture <- susie(X, y, L = L,
                       prior_variance_grid = c(V_eff),
                       mixture_weights = c(1),
                       estimate_residual_variance = FALSE,
                       max_iter = 20, tol = 1e-4)
  # Degenerate mixture must reproduce the scalar path to 1e-10.
  expect_equal(fit_scalar$pip, fit_mixture$pip, tolerance = 1e-10)
  expect_equal(fit_scalar$alpha, fit_mixture$alpha, tolerance = 1e-10)
  expect_equal(fit_scalar$mu, fit_mixture$mu, tolerance = 1e-10)
  expect_equal(fit_scalar$lbf, fit_mixture$lbf, tolerance = 1e-10)
})

# =============================================================================
# Test 2: K=1 mixture matches scalar V exactly (RSS data)
# =============================================================================
test_that("K=1 mixture matches scalar V for RSS data", {
  L <- 5
  # Run scalar path first to find what V is actually used
  fit_scalar <- susie_rss(z = z, R = R, n = n, L = L,
                          estimate_prior_variance = FALSE,
                          estimate_residual_variance = FALSE,
                          max_iter = 20, tol = 1e-4)
  # The effective V is stored in fit_scalar$V[1] (same for all L since
  # scaled_prior_variance is a scalar and estimate_prior_variance = FALSE)
  V_eff <- fit_scalar$V[1]
  # K=1 mixture path with the same effective V
  fit_mixture <- susie_rss(z = z, R = R, n = n, L = L,
                           prior_variance_grid = c(V_eff),
                           mixture_weights = c(1),
                           estimate_residual_variance = FALSE,
                           max_iter = 20, tol = 1e-4)
  expect_equal(fit_scalar$pip, fit_mixture$pip, tolerance = 1e-10)
  expect_equal(fit_scalar$alpha, fit_mixture$alpha, tolerance = 1e-10)
  expect_equal(fit_scalar$mu, fit_mixture$mu, tolerance = 1e-10)
  expect_equal(fit_scalar$lbf, fit_mixture$lbf, tolerance = 1e-10)
})

# =============================================================================
# Test 3: K=1 mixture matches scalar V exactly (sufficient stats)
# =============================================================================
test_that("K=1 mixture matches scalar V for sufficient stats", {
  L <- 5
  XtX <- crossprod(X)
  Xty <- crossprod(X, y)
  yty <- sum(y^2)
  # Run scalar path first to find effective V
  fit_scalar <- susie_ss(XtX = XtX, Xty = Xty, yty = yty, n = n, L = L,
                         estimate_prior_variance = FALSE,
                         estimate_residual_variance = FALSE,
                         max_iter = 20, tol = 1e-4)
  V_eff <- fit_scalar$V[1]
  # K=1 mixture path with the same effective V
  fit_mixture <- susie_ss(XtX = XtX, Xty = Xty, yty = yty, n = n, L = L,
                          prior_variance_grid = c(V_eff),
                          mixture_weights = c(1),
                          estimate_residual_variance = FALSE,
                          max_iter = 20, tol = 1e-4)
  expect_equal(fit_scalar$pip, fit_mixture$pip, tolerance = 1e-10)
  expect_equal(fit_scalar$alpha, fit_mixture$alpha, tolerance = 1e-10)
  expect_equal(fit_scalar$mu, fit_mixture$mu, tolerance = 1e-10)
  expect_equal(fit_scalar$lbf, fit_mixture$lbf, tolerance = 1e-10)
})

# =============================================================================
# Test 4: K>1 mixture produces valid outputs
# =============================================================================
test_that("K=3 mixture produces valid outputs for RSS data", {
  L <- 5
  grid <- c(1, 10, 50)
  w <- c(0.3, 0.5, 0.2)
  fit <- susie_rss(z = z, R = R, n = n, L = L,
                   prior_variance_grid = grid,
                   mixture_weights = w,
                   estimate_residual_variance = FALSE,
                   max_iter = 20, tol = 1e-4)
  # PIPs in [0, 1]
  expect_true(all(fit$pip >= 0 & fit$pip <= 1))
  # Alpha rows sum to 1
  expect_equal(rowSums(fit$alpha), rep(1, L), tolerance = 1e-10)
  # lbf_grid is a list of L elements
  expect_length(fit$lbf_grid, L)
  # Each element is p x K matrix
  expect_equal(dim(fit$lbf_grid[[1]]), c(p, 3))
  # Posterior means are finite
  expect_true(all(is.finite(fit$mu)))
  # Posterior second moments >= posterior means squared
  expect_true(all(fit$mu2 >= fit$mu^2 - 1e-10))
})

# =============================================================================
# Test 5: Uniform weights produces correct mixture BF
# =============================================================================
test_that("Uniform mixture weights give correct BF", {
  L <- 1
  grid <- c(1, 50)
  w <- c(0.5, 0.5)
  fit <- susie_rss(z = z, R = R, n = n, L = L,
                   prior_variance_grid = grid,
                   mixture_weights = w,
                   estimate_residual_variance = FALSE,
                   max_iter = 1)
  # Manually compute mixture BF for variant 1
  # lbf(V) = -0.5*log(1 + V*R[1,1]) + 0.5*z[1]^2*V*R[1,1]/(V*R[1,1]+1)
  # For RSS with lambda=0, sigma2=1: shat2 = 1/R[1,1], betahat = z[1]/R[1,1] * shat2
  # This is approximate due to eigendecomposition; just check BF matrix shape
  expect_equal(ncol(fit$lbf_grid[[1]]), 2)
  expect_equal(nrow(fit$lbf_grid[[1]]), p)
})

# =============================================================================
# Test 6: Input validation
# =============================================================================
test_that("Invalid mixture prior inputs are rejected", {
  # Mismatched lengths
  expect_error(
    susie_rss(z = z, R = R, n = n, L = 5,
              prior_variance_grid = c(1, 10),
              mixture_weights = c(1)),
    "length"
  )
  # Negative grid values
  expect_error(
    susie_rss(z = z, R = R, n = n, L = 5,
              prior_variance_grid = c(-1, 10),
              mixture_weights = c(0.5, 0.5)),
    "prior_variance_grid"
  )
  # Weights not summing to 1
  expect_error(
    susie_rss(z = z, R = R, n = n, L = 5,
              prior_variance_grid = c(1, 10),
              mixture_weights = c(0.3, 0.3)),
    "sum"
  )
})

# =============================================================================
# Test 7: Default weights (uniform) when mixture_weights is NULL
# =============================================================================
test_that("NULL mixture_weights defaults to uniform", {
  L <- 5
  grid <- c(1, 10, 50)
  # Should not error, should use uniform weights
  fit <- susie_rss(z = z, R = R, n = n, L = L,
                   prior_variance_grid = grid,
                   estimate_residual_variance = FALSE,
                   max_iter = 5)
  expect_true(all(fit$pip >= 0 & fit$pip <= 1))
})

# =============================================================================
# Test 8: Existing tests still pass (backward compatibility)
# =============================================================================
test_that("Standard susie_rss without mixture prior is unchanged", {
  fit <- susie_rss(z = z, R = R, n = n, L = 5,
                   estimate_prior_variance = TRUE,
                   estimate_residual_variance = FALSE,
                   max_iter = 20)
  expect_true(all(fit$pip >= 0 & fit$pip <= 1))
  expect_null(fit$lbf_grid) # no grid stored in standard path
})

# =============================================================================
# Test 9: K=1 mixture with RSS-lambda path (explicit lambda > 0)
# =============================================================================
test_that("K=1 mixture matches scalar V with lambda regularization", {
  L <- 3
  lam <- 0.1
  fit_scalar <- susie_rss_lambda(z = z, R = R, n = n, L = L, lambda = lam,
                                 estimate_prior_variance = FALSE,
                                 estimate_residual_variance = FALSE,
                                 max_iter = 10)
  V_eff <- fit_scalar$V[1]
  fit_mixture <- susie_rss_lambda(z = z, R = R, n = n, L = L, lambda = lam,
                                  prior_variance_grid = c(V_eff),
                                  mixture_weights = c(1),
                                  estimate_residual_variance = FALSE,
                                  max_iter = 10)
  expect_equal(fit_scalar$alpha, fit_mixture$alpha, tolerance = 1e-10)
  expect_equal(fit_scalar$mu, fit_mixture$mu, tolerance = 1e-10)
  expect_equal(fit_scalar$lbf, fit_mixture$lbf, tolerance = 1e-10)
})

# =============================================================================
# Test 10: Mixture prior with finite-reference R inflation (inflated shat2)
# =============================================================================
test_that("Mixture prior works with finite-reference R inflation", {
  skip_if_not_installed("Matrix")
  L <- 3
  grid <- c(1, 10, 50)
  w <- c(0.3, 0.5, 0.2)
  # Run with R_finite to trigger shat2 inflation
  fit <- susie_rss(z = z, R = R, n = n, L = L,
                   prior_variance_grid = grid,
                   mixture_weights = w,
                   estimate_residual_variance = FALSE,
                   R_finite = 30,
                   max_iter = 5)
  # Basic validity
  expect_true(all(fit$pip >= 0 & fit$pip <= 1))
  expect_equal(rowSums(fit$alpha), rep(1, L), tolerance = 1e-10)
  expect_length(fit$lbf_grid, L)
})

# =============================================================================
# Test 11: Mixture weights are correctly used (asymmetric weights)
# =============================================================================
test_that("Asymmetric mixture weights shift PIPs correctly", {
  L <- 3
  # Large V component only: should produce wider credible intervals
  fit_large <- susie_rss(z = z, R = R, n = n, L = L,
                         prior_variance_grid = c(0.001, 100),
                         mixture_weights = c(0.01, 0.99),
                         estimate_residual_variance = FALSE,
                         max_iter = 10)
  # Small V component only: should produce tighter credible intervals
  fit_small <- susie_rss(z = z, R = R, n = n, L = L,
                         prior_variance_grid = c(0.001, 100),
                         mixture_weights = c(0.99, 0.01),
                         estimate_residual_variance = FALSE,
                         max_iter = 10)
  # Both should be valid
  expect_true(all(fit_large$pip >= 0 & fit_large$pip <= 1))
  expect_true(all(fit_small$pip >= 0 & fit_small$pip <= 1))
  # PIPs should differ
  expect_false(all(abs(fit_large$pip - fit_small$pip) < 1e-6))
})

# =============================================================================
# Test 12: K=1 individual data exact match (L=1, single iteration)
# =============================================================================
test_that("K=1 mixture is numerically identical for L=1 individual data", {
  L <- 1
  fit_scalar <- susie(X, y, L = L,
                      estimate_prior_variance = FALSE,
                      estimate_residual_variance = FALSE,
                      max_iter = 1)
  V_eff <- fit_scalar$V[1]
  fit_mixture <- susie(X, y, L = L,
                       prior_variance_grid = c(V_eff),
                       mixture_weights = c(1),
                       estimate_residual_variance = FALSE,
                       max_iter = 1)
  # After exactly 1 iteration with L=1, results must match to machine precision
  expect_equal(fit_scalar$alpha, fit_mixture$alpha,
               tolerance = .Machine$double.eps * 10)
  expect_equal(fit_scalar$mu, fit_mixture$mu,
               tolerance = .Machine$double.eps * 10)
  expect_equal(fit_scalar$lbf, fit_mixture$lbf,
               tolerance = .Machine$double.eps * 10)
})

================================================
FILE: tests/testthat/test_mr_ash_equivalence.R
================================================
# =============================================================================
# Test: mr.ash vs mr.ash.rss Equivalence
# =============================================================================
#
# Verifies that mr.ash (individual-level data) and mr.ash.rss (summary
# statistics) produce equivalent results when fed the same data.
#
# The key mathematical relationship is:
#   mr.ash model: beta_j ~ sum_k pi_k * N(0, sigma2 * sa2[k])
#   mr.ash.rss reconstructs X'X, X'y from (bhat, shat, R, var_y, n)
#   and uses s0 as the prior variance scale (multiplied by sigma2_e internally).
#
# Summary statistics are derived from individual data as:
#   bhat_j = X_j'y / X_j'X_j            (univariate OLS)
#   shat_j = sqrt(RSS_j / ((n-2) * X_j'X_j))  (standard error with n-2 df)
#   R = cor(X)
#   var_y = var(y)
# =============================================================================

# Helper: derive summary statistics from individual data
# Uses n-2 df for shat to match the PVE adjustment in mr.ash.rss
# Returns a list with fields bhat, shat, R, var_y, n.
derive_summary_stats <- function(X, y) {
  n <- nrow(X)
  p <- ncol(X)
  # Per-column univariate OLS coefficient: X_j'y / X_j'X_j.
  bhat <- sapply(1:p, function(j) sum(X[, j] * y) / sum(X[, j]^2))
  # Standard error of bhat_j from the univariate residuals, with n-2 df.
  shat <- sapply(1:p, function(j) {
    resid <- y - X[, j] * bhat[j]
    sqrt(sum(resid^2) / ((n - 2) * sum(X[, j]^2)))
  })
  R_mat <- cor(X)
  var_y <- c(var(y))
  list(bhat = bhat, shat = shat, R = R_mat, var_y = var_y, n = n)
}

# Helper: generate test data and prior
# Simulates a centered (X, y) pair with k nonzero effects and constructs the
# mixture-prior grid (sa2), uniform mixture weights (pi0), and an initial
# residual variance (sigma2_init).
setup_mr_ash_test <- function(n = 100, p = 50, k = 5, seed = 42) {
  set.seed(seed)
  X <- matrix(rnorm(n * p), n, p)
  X <- scale(X, center = TRUE, scale = FALSE)
  beta_true <- rep(0, p)
  causal <- sample(1:p, k)
  beta_true[causal] <- rnorm(k, sd = 2)
  y <- c(X %*% beta_true + rnorm(n))
  y <- y - mean(y)

  # Prior matching mr.ash defaults
  sa2 <- c(0, (2^((1:19) / 20) - 1)^2)
  w <- colSums(X^2)
  sa2 <- sa2 / median(w) * n
  K <- length(sa2)
  pi0 <- rep(1 / K, K)
  sigma2_init <- c(var(y))

  list(
    X = X, y = y, n = n, p = p,
    sa2 = sa2, K = K, pi0 = pi0,
    sigma2_init = sigma2_init
  )
}

test_that("mr.ash and mr.ash.rss produce identical beta with fixed sigma and pi", {
  d <- setup_mr_ash_test(n = 100, p = 50, k = 5, seed = 42)
  # All EM updates frozen: the two implementations should agree essentially
  # to machine precision.
  fit_ind <- mr.ash(d$X, d$y,
    sa2 = d$sa2, pi = d$pi0, sigma2 = d$sigma2_init,
    intercept = FALSE, standardize = FALSE,
    update.sigma2 = FALSE, update.pi = FALSE,
    max.iter = 100, verbose = FALSE
  )
  ss <- derive_summary_stats(d$X, d$y)
  fit_rss <- mr.ash.rss(
    bhat = ss$bhat, shat = ss$shat, R = ss$R,
    var_y = ss$var_y, n = ss$n,
    sigma2_e = d$sigma2_init, s0 = d$sa2, w0 = d$pi0,
    tol = 1e-4, max_iter = 100,
    update_w0 = FALSE, update_sigma = FALSE
  )
  # Should match to near-machine precision (ignore dim attributes from Armadillo)
  expect_equal(c(fit_rss$beta), c(fit_ind$beta), tolerance = 1e-10)
  expect_equal(c(fit_rss$sigma2), c(fit_ind$sigma2), tolerance = 1e-10)
  expect_equal(c(fit_rss$pi), c(fit_ind$pi), tolerance = 1e-10)
})

test_that("mr.ash and mr.ash.rss agree with sigma2 updates enabled", {
  d <- setup_mr_ash_test(n = 100, p = 50, k = 5, seed = 42)
  fit_ind <- mr.ash(d$X, d$y,
    sa2 = d$sa2, pi = d$pi0, sigma2 = d$sigma2_init,
    intercept = FALSE, standardize = FALSE,
    update.sigma2 = TRUE, update.pi = FALSE,
    max.iter = 200, verbose = FALSE
  )
  ss <- derive_summary_stats(d$X, d$y)
  fit_rss <- mr.ash.rss(
    bhat = ss$bhat, shat = ss$shat, R = ss$R,
    var_y = ss$var_y, n = ss$n,
    sigma2_e = d$sigma2_init, s0 = d$sa2, w0 = d$pi0,
    tol = 1e-4, max_iter = 200,
    update_w0 = FALSE, update_sigma = TRUE
  )
  # With sigma2 estimated, the two update paths differ slightly, so the
  # tolerances are looser than the fixed-parameter case.
  expect_equal(c(fit_rss$beta), c(fit_ind$beta), tolerance = 1e-3)
  expect_equal(c(fit_rss$sigma2), c(fit_ind$sigma2), tolerance = 1e-4)
})

test_that("mr.ash and mr.ash.rss agree with full EM (sigma + pi updates)", {
  d <- setup_mr_ash_test(n = 100, p = 50, k = 5, seed = 42)
  fit_ind <- mr.ash(d$X, d$y,
    sa2 = d$sa2, pi = d$pi0, sigma2 = d$sigma2_init,
    intercept = FALSE, standardize = FALSE,
    update.sigma2 = TRUE, update.pi = TRUE,
    max.iter = 200, verbose = FALSE
  )
  ss <- derive_summary_stats(d$X, d$y)
  fit_rss <- mr.ash.rss(
    bhat = ss$bhat, shat = ss$shat, R = ss$R,
    var_y = ss$var_y, n = ss$n,
    sigma2_e = d$sigma2_init, s0 = d$sa2, w0 = d$pi0,
    tol = 1e-4, max_iter = 200,
    update_w0 = TRUE, update_sigma = TRUE
  )
  expect_equal(c(fit_rss$beta), c(fit_ind$beta), tolerance = 1e-3)
  expect_equal(c(fit_rss$sigma2), c(fit_ind$sigma2), tolerance = 1e-3)
  expect_equal(c(fit_rss$pi), c(fit_ind$pi), tolerance = 1e-2)
})

test_that("mr.ash.rss output format matches mr.ash", {
  d <- setup_mr_ash_test(n = 80, p = 20, k = 3, seed = 123)
  ss <- derive_summary_stats(d$X, d$y)
  fit_rss <- mr.ash.rss(
    bhat = ss$bhat, shat = ss$shat, R = ss$R,
    var_y = ss$var_y, n = ss$n,
    sigma2_e = 1.0, s0 = d$sa2, w0 = d$pi0,
    tol = 1e-4, max_iter = 100,
    update_w0 = FALSE, update_sigma = FALSE
  )
  # Check that mr.ash-compatible fields exist and have correct types
  expect_true(is.numeric(fit_rss$beta))
  expect_true(is.numeric(fit_rss$sigma2))
  expect_true(is.numeric(fit_rss$pi))
  expect_true(is.integer(fit_rss$iter))
  expect_true(is.numeric(fit_rss$varobj))
  # Check dimensions
  expect_length(fit_rss$beta, d$p)
  expect_length(fit_rss$sigma2, 1)
  expect_length(fit_rss$pi, d$K)
  expect_true(fit_rss$iter > 0)
  # varobj holds one entry per completed iteration, bounded by max_iter.
  expect_true(length(fit_rss$varobj) > 0)
  expect_true(length(fit_rss$varobj) <= 100)
  # Original RSS-specific fields also present
  expect_true(!is.null(fit_rss$mu1))
  expect_true(!is.null(fit_rss$sigma2_1))
  expect_true(!is.null(fit_rss$w1))
  expect_true(!is.null(fit_rss$sigma2_e))
  expect_true(!is.null(fit_rss$w0))
})

test_that("mr.ash and mr.ash.rss agree on different data sizes", {
  # Test with a wider range of n, p combinations
  for (params in list(
    list(n = 80, p = 20, k = 3, seed = 100),
    list(n = 200, p = 30, k = 5, seed = 200)
  )) {
    d <- setup_mr_ash_test(
      n = params$n, p = params$p, k = params$k, seed = params$seed
    )
    fit_ind <- mr.ash(d$X, d$y,
      sa2 = d$sa2, pi = d$pi0, sigma2 = d$sigma2_init,
      intercept = FALSE, standardize = FALSE,
      update.sigma2 = FALSE, update.pi = FALSE,
      max.iter = 50, verbose = FALSE
    )
    ss <- derive_summary_stats(d$X, d$y)
    fit_rss <- mr.ash.rss(
      bhat = ss$bhat, shat = ss$shat, R = ss$R,
      var_y = ss$var_y, n = ss$n,
      sigma2_e = d$sigma2_init, s0 = d$sa2, w0 = d$pi0,
      tol = 1e-4, max_iter = 50,
      update_w0 = FALSE, update_sigma = FALSE
    )
    expect_equal(c(fit_rss$beta), c(fit_ind$beta), tolerance = 1e-10,
      label = sprintf("beta (n=%d, p=%d)", params$n, params$p)
    )
  }
})

================================================
FILE: tests/testthat/test_plotting.R
================================================
context("Plotting functions")

# =============================================================================
# SUSIE_PLOT - BASIC FUNCTIONALITY
#
============================================================================= test_that("susie_plot with PIP creates plot without error", { set.seed(1) dat <- simulate_regression(n = 100, p = 50, k = 3) fit <- susie(dat$X, dat$y, L = 5, verbose = FALSE) # Should not error expect_error( susie_plot(fit, "PIP"), NA ) }) test_that("susie_plot with z-scores requires compute_univariate_zscore", { set.seed(2) dat <- simulate_regression(n = 100, p = 50, k = 3) fit <- susie(dat$X, dat$y, L = 5, compute_univariate_zscore = FALSE, verbose = FALSE) # Should error when z-scores not computed expect_error( susie_plot(fit, "z"), "z-scores are not available" ) }) test_that("susie_plot with z_original also requires z-scores", { set.seed(51) dat <- simulate_regression(n = 100, p = 50, k = 3) fit <- susie(dat$X, dat$y, L = 5, compute_univariate_zscore = FALSE, verbose = FALSE) # Should error when trying to plot z_original without z-scores expect_error( susie_plot(fit, "z_original"), "z-scores are not available" ) }) test_that("susie_plot with z-scores works when available", { set.seed(3) dat <- simulate_regression(n = 100, p = 50, k = 3) fit <- susie(dat$X, dat$y, L = 5, compute_univariate_zscore = TRUE, verbose = FALSE) # Should not error expect_error( susie_plot(fit, "z"), NA ) }) test_that("susie_plot with z_original works", { set.seed(4) dat <- simulate_regression(n = 100, p = 50, k = 3) fit <- susie(dat$X, dat$y, L = 5, compute_univariate_zscore = TRUE, verbose = FALSE) expect_error( susie_plot(fit, "z_original"), NA ) }) test_that("susie_plot with log10PIP works", { set.seed(5) dat <- simulate_regression(n = 100, p = 50, k = 3) fit <- susie(dat$X, dat$y, L = 5, verbose = FALSE) expect_error( susie_plot(fit, "log10PIP"), NA ) }) test_that("susie_plot with invalid y type errors", { set.seed(6) dat <- simulate_regression(n = 100, p = 50, k = 3) fit <- susie(dat$X, dat$y, L = 5, verbose = FALSE) expect_error( susie_plot(fit, "invalid_type"), "Need to specify" ) }) 
test_that("susie_plot errors when pos list missing required elements", { set.seed(34) dat <- simulate_regression(n = 100, p = 50, k = 3) fit <- susie(dat$X, dat$y, L = 5, verbose = FALSE) fit$genomic_position <- 1000 + (1:length(fit$pip)) # Missing 'attr' expect_error( susie_plot(fit, "PIP", pos = list(start = 1000, end = 1025)), "pos argument should be a list" ) # Missing 'start' expect_error( susie_plot(fit, "PIP", pos = list(attr = "genomic_position", end = 1025)), "pos argument should be a list" ) # Missing 'end' expect_error( susie_plot(fit, "PIP", pos = list(attr = "genomic_position", start = 1000)), "pos argument should be a list" ) }) test_that("susie_plot errors when pos$attr not in model", { set.seed(35) dat <- simulate_regression(n = 100, p = 50, k = 3) fit <- susie(dat$X, dat$y, L = 5, verbose = FALSE) expect_error( susie_plot(fit, "PIP", pos = list(attr = "nonexistent_attr", start = 1, end = 25)), "Cannot find attribute nonexistent_attr" ) }) test_that("susie_plot errors when pos$start >= pos$end", { set.seed(36) dat <- simulate_regression(n = 100, p = 50, k = 3) fit <- susie(dat$X, dat$y, L = 5, verbose = FALSE) fit$genomic_position <- 1000 + (1:length(fit$pip)) expect_error( susie_plot(fit, "PIP", pos = list(attr = "genomic_position", start = 1025, end = 1000)), "Position start should be smaller than end" ) # Equal values expect_error( susie_plot(fit, "PIP", pos = list(attr = "genomic_position", start = 1000, end = 1000)), "Position start should be smaller than end" ) }) test_that("susie_plot errors when numeric pos outside range", { set.seed(37) dat <- simulate_regression(n = 100, p = 50, k = 3) fit <- susie(dat$X, dat$y, L = 5, verbose = FALSE) expect_error( susie_plot(fit, "PIP", pos = 1:100), # Only 50 variables "Provided position is outside the range" ) expect_error( susie_plot(fit, "PIP", pos = c(0, 1, 2)), # 0 is out of range "Provided position is outside the range" ) }) # 
============================================================================= # SUSIE_PLOT - PARAMETERS # ============================================================================= test_that("susie_plot with add_bar=TRUE works", { set.seed(7) dat <- simulate_regression(n = 100, p = 50, k = 3) fit <- susie(dat$X, dat$y, L = 5, verbose = FALSE) expect_error( susie_plot(fit, "PIP", add_bar = TRUE), NA ) }) test_that("susie_plot with add_legend=TRUE works", { set.seed(8) dat <- simulate_regression(n = 200, p = 100, k = 3, signal_sd = 2) fit <- susie(dat$X, dat$y, L = 10, verbose = FALSE) expect_error( susie_plot(fit, "PIP", add_legend = TRUE), NA ) }) test_that("susie_plot with add_legend location string works", { set.seed(9) dat <- simulate_regression(n = 200, p = 100, k = 3, signal_sd = 2) fit <- susie(dat$X, dat$y, L = 10, verbose = FALSE) expect_error( susie_plot(fit, "PIP", add_legend = "bottomright"), NA ) }) test_that("susie_plot with pos as numeric vector works", { set.seed(10) dat <- simulate_regression(n = 100, p = 50, k = 3) fit <- susie(dat$X, dat$y, L = 5, verbose = FALSE) # Plot subset of variables expect_error( susie_plot(fit, "PIP", pos = 1:25), NA ) }) test_that("susie_plot with pos as list works", { set.seed(11) dat <- simulate_regression(n = 100, p = 50, k = 3) fit <- susie(dat$X, dat$y, L = 5, verbose = FALSE) fit$genomic_position <- 1000 + (1:length(fit$pip)) # Plot with custom position attribute expect_error( susie_plot(fit, "PIP", pos = list(attr = "genomic_position", start = 1000, end = 1025)), NA ) }) test_that("susie_plot with b (true effects) works", { set.seed(12) dat <- simulate_regression(n = 100, p = 50, k = 3) fit <- susie(dat$X, dat$y, L = 5, verbose = FALSE) # Highlight true effects expect_error( susie_plot(fit, "PIP", b = dat$beta), NA ) }) test_that("susie_plot with max_cs parameter works", { set.seed(13) dat <- simulate_regression(n = 200, p = 100, k = 3, signal_sd = 2) fit <- susie(dat$X, dat$y, L = 10, verbose = FALSE) # Limit 
number of CS displayed expect_error( susie_plot(fit, "PIP", max_cs = 2), NA ) }) test_that("susie_plot with max_cs purity threshold works", { set.seed(38) dat <- simulate_regression(n = 200, p = 100, k = 3, signal_sd = 2) fit <- susie(dat$X, dat$y, L = 10, verbose = FALSE) # Filter by purity (< 1) expect_error( susie_plot(fit, "PIP", max_cs = 0.5, add_legend = TRUE), NA ) # Very strict purity filter (should exclude most/all CS) expect_error( susie_plot(fit, "PIP", max_cs = 0.99), NA ) # Very lenient purity filter expect_error( susie_plot(fit, "PIP", max_cs = 0.1), NA ) }) test_that("susie_plot with different legend positions works", { set.seed(39) dat <- simulate_regression(n = 200, p = 100, k = 3, signal_sd = 2) fit <- susie(dat$X, dat$y, L = 10, verbose = FALSE) positions <- c("topleft", "top", "left", "center", "right", "bottomleft", "bottom") for (pos in positions) { expect_error( susie_plot(fit, "PIP", add_legend = pos), NA, info = paste("Failed for legend position:", pos) ) } }) test_that("susie_plot with invalid legend position defaults to topright", { set.seed(40) dat <- simulate_regression(n = 200, p = 100, k = 3, signal_sd = 2) fit <- susie(dat$X, dat$y, L = 10, verbose = FALSE) # Invalid position should default to "topright" (no error) expect_error( susie_plot(fit, "PIP", add_legend = "invalid_position"), NA ) }) test_that("susie_plot respects custom plotting parameters", { set.seed(41) dat <- simulate_regression(n = 100, p = 50, k = 3) fit <- susie(dat$X, dat$y, L = 5, verbose = FALSE) # Test various plotting parameters expect_error( susie_plot(fit, "PIP", main = "Custom Title", col = "blue", cex = 0.5), NA ) expect_error( susie_plot(fit, "PIP", xlim = c(0, 30), ylim = c(0, 1)), NA ) }) # ============================================================================= # SUSIE_PLOT - VECTOR INPUT # ============================================================================= test_that("susie_plot with PIP vector input works", { set.seed(14) pip <- runif(50) 
expect_error( susie_plot(pip, "PIP"), NA ) }) test_that("susie_plot with z-score vector input works", { set.seed(15) z <- rnorm(50) expect_error( susie_plot(z, "z"), NA ) }) test_that("susie_plot with non-susie vector and different y types", { set.seed(42) # Test with z_original on vector z_vec <- rnorm(50) expect_error(susie_plot(z_vec, "z_original"), NA) # Test with log10PIP on vector pip_vec <- runif(50) expect_error(susie_plot(pip_vec, "log10PIP"), NA) # Test with generic data (not PIP, z, etc.) data_vec <- runif(50, 0, 10) expect_error(susie_plot(data_vec, "custom_data"), NA) }) # ============================================================================= # SUSIE_PLOT - EDGE CASES # ============================================================================= test_that("susie_plot with no credible sets works", { set.seed(16) dat <- simulate_regression(n = 100, p = 50, k = 0) # No signal fit <- susie(dat$X, dat$y, L = 5, verbose = FALSE) expect_error( susie_plot(fit, "PIP"), NA ) }) test_that("susie_plot with single variable works", { set.seed(17) dat <- simulate_regression(n = 100, p = 1, k = 1) fit <- susie(dat$X, dat$y, L = 1, verbose = FALSE) expect_error( susie_plot(fit, "PIP"), NA ) }) test_that("susie_plot returns NULL invisibly", { set.seed(18) dat <- simulate_regression(n = 100, p = 50, k = 3) fit <- susie(dat$X, dat$y, L = 5, verbose = FALSE) result <- susie_plot(fit, "PIP") expect_null(result) }) test_that("susie_plot with list pos and credible sets adjusts correctly", { set.seed(43) # Create data with clear signal so we get CS dat <- simulate_regression(n = 200, p = 100, k = 3, signal_sd = 2) fit <- susie(dat$X, dat$y, L = 10, verbose = FALSE) fit$genomic_position <- 1000 + (1:length(fit$pip)) # Should successfully plot with CS adjusted to new positions expect_error( susie_plot(fit, "PIP", pos = list(attr = "genomic_position", start = 1000, end = 1050), add_legend = TRUE), NA ) }) test_that("susie_plot with b parameter highlights specific 
positions", { set.seed(44) dat <- simulate_regression(n = 100, p = 50, k = 3) fit <- susie(dat$X, dat$y, L = 5, verbose = FALSE) # Test with b having non-zero elements at specific positions b_test <- rep(0, 50) b_test[c(10, 20, 30)] <- 1 expect_error( susie_plot(fit, "PIP", b = b_test), NA ) # Test with actual beta from simulation and add_bar expect_error( susie_plot(fit, "PIP", b = dat$beta, add_bar = TRUE, add_legend = TRUE), NA ) }) test_that("susie_plot sets x0 and y1 to NULL when CS filtered by max_cs", { set.seed(52) dat <- simulate_regression(n = 200, p = 100, k = 3, signal_sd = 2) fit <- susie(dat$X, dat$y, L = 10, verbose = FALSE) # Get CS with purity info fit$sets <- susie_get_cs(fit, X = dat$X, coverage = 0.95) if (!is.null(fit$sets$cs) && length(fit$sets$cs) > 0) { # Use very strict max_cs filter (size < 1) to exclude CS # This should trigger the else branch: x0 <- NULL; y1 <- NULL expect_error( susie_plot(fit, "PIP", max_cs = 1, add_legend = TRUE), # Only CS with size < 1 NA ) # Also test with very high purity threshold (max_cs as purity) expect_error( susie_plot(fit, "PIP", max_cs = 0.999, add_legend = TRUE), # Very high purity NA ) } else { skip("No CS found for max_cs filter test") } }) test_that("susie_plot skips CS when x0 is NULL (next statement)", { set.seed(53) dat <- simulate_regression(n = 200, p = 100, k = 3, signal_sd = 2) fit <- susie(dat$X, dat$y, L = 10, verbose = FALSE) # Get CS fit$sets <- susie_get_cs(fit, X = dat$X, coverage = 0.95) if (!is.null(fit$sets$cs) && length(fit$sets$cs) > 0) { # Use max_cs to filter out large CS, causing is.null(x0) to be TRUE # This should trigger the next statement to skip those CS expect_error( susie_plot(fit, "PIP", max_cs = 2), # Skip CS with > 2 variables NA ) } else { skip("No CS found for next statement test") } }) test_that("susie_plot uses cs_index when available (else uses cs_idx)", { set.seed(54) dat <- simulate_regression(n = 200, p = 100, k = 3, signal_sd = 2) fit <- susie(dat$X, dat$y, L = 
10, verbose = FALSE) # Get CS which should populate cs_index fit$sets <- susie_get_cs(fit, X = dat$X, coverage = 0.95) if (!is.null(fit$sets$cs) && length(fit$sets$cs) > 0) { # When cs_index exists, should use it expect_true(!is.null(fit$sets$cs_index)) # Plot with legend to see cs_index values expect_error( susie_plot(fit, "PIP", add_legend = TRUE), NA ) # Test the else branch: remove cs_index to force use of cs_idx fit_no_index <- fit fit_no_index$sets$cs_index <- NULL expect_error( susie_plot(fit_no_index, "PIP", add_legend = TRUE), NA ) } else { skip("No CS found for cs_index test") } }) # ============================================================================= # SUSIE_PLOT_ITERATION # ============================================================================= test_that("susie_plot_iteration uses tempdir when file_prefix missing", { set.seed(55) dat <- simulate_regression(n = 100, p = 50, k = 3) fit <- susie(dat$X, dat$y, L = 5, track_fit = FALSE, verbose = FALSE) # Don't provide file_prefix - should use tempdir() result <- invisible(capture.output({ suppressMessages(susie_plot_iteration(fit, L = 5)) }, type = "output")) # Check that file was created in tempdir expected_path <- file.path(tempdir(), "susie_plot.pdf") expect_true(file.exists(expected_path)) # Clean up if (file.exists(expected_path)) file.remove(expected_path) }) test_that("susie_plot_iteration with track_fit=FALSE uses final fit only", { set.seed(19) dat <- simulate_regression(n = 100, p = 50, k = 3) # Without track_fit fit <- susie(dat$X, dat$y, L = 5, track_fit = FALSE, verbose = FALSE) temp_prefix <- tempfile("susie_iter_no_track_") # Should work but only plot final iteration expect_error({ invisible(capture.output({ suppressMessages(susie_plot_iteration(fit, L = 5, file_prefix = temp_prefix)) }, type = "output")) }, NA) # Clean up temp_files <- list.files(dirname(temp_prefix), pattern = basename(temp_prefix), full.names = TRUE) file.remove(temp_files) }) test_that("susie_plot_iteration 
works with track_fit=TRUE", { set.seed(20) dat <- simulate_regression(n = 100, p = 50, k = 3) # With track_fit fit <- susie(dat$X, dat$y, L = 5, track_fit = TRUE, max_iter = 10, verbose = FALSE) # Create temp file for output temp_prefix <- tempfile("susie_iter_") expect_error({ invisible(capture.output({ suppressMessages(susie_plot_iteration(fit, L = 5, file_prefix = temp_prefix)) }, type = "output")) }, NA) # Clean up temp files temp_files <- list.files(dirname(temp_prefix), pattern = basename(temp_prefix), full.names = TRUE) file.remove(temp_files) }) test_that("susie_plot_iteration with pos parameter works", { set.seed(21) dat <- simulate_regression(n = 100, p = 50, k = 3) fit <- susie(dat$X, dat$y, L = 5, track_fit = TRUE, max_iter = 10, verbose = FALSE) temp_prefix <- tempfile("susie_iter_pos_") expect_error({ invisible(capture.output({ suppressMessages(susie_plot_iteration(fit, L = 5, file_prefix = temp_prefix, pos = 1:25)) }, type = "output")) }, NA) # Clean up temp_files <- list.files(dirname(temp_prefix), pattern = basename(temp_prefix), full.names = TRUE) file.remove(temp_files) }) test_that("susie_plot_iteration creates PDF files", { set.seed(22) dat <- simulate_regression(n = 100, p = 50, k = 3) fit <- susie(dat$X, dat$y, L = 5, track_fit = TRUE, max_iter = 5, verbose = FALSE) temp_dir <- tempdir() temp_prefix <- file.path(temp_dir, "test_susie_iter") invisible(capture.output({ suppressMessages(susie_plot_iteration(fit, L = 5, file_prefix = temp_prefix)) }, type = "output")) # Check that PDF files were created pdf_files <- list.files(temp_dir, pattern = "test_susie_iter.*\\.pdf$", full.names = TRUE) expect_true(length(pdf_files) > 0) # Clean up file.remove(pdf_files) }) test_that("susie_plot_iteration with L greater than nrow(alpha)", { set.seed(45) dat <- simulate_regression(n = 100, p = 50, k = 3) fit <- susie(dat$X, dat$y, L = 3, track_fit = TRUE, verbose = FALSE) temp_prefix <- tempfile("test_large_L_") # Request L=10 when fit only has L=3 
expect_error({ invisible(capture.output({ suppressMessages(susie_plot_iteration(fit, L = 10, file_prefix = temp_prefix)) }, type = "output")) }, NA) # Clean up temp_files <- list.files(dirname(temp_prefix), pattern = basename(temp_prefix), full.names = TRUE) if (length(temp_files) > 0) file.remove(temp_files) }) test_that("susie_plot_iteration with few iterations", { set.seed(46) dat <- simulate_regression(n = 100, p = 50, k = 3) # Use max_iter=5 to ensure we have some iterations tracked fit <- susie(dat$X, dat$y, L = 5, track_fit = TRUE, max_iter = 5, verbose = FALSE) temp_prefix <- tempfile("test_few_iter_") expect_error({ invisible(capture.output({ suppressMessages(susie_plot_iteration(fit, L = 5, file_prefix = temp_prefix)) }, type = "output")) }, NA) # Clean up temp_files <- list.files(dirname(temp_prefix), pattern = basename(temp_prefix), full.names = TRUE) if (length(temp_files) > 0) file.remove(temp_files) }) test_that("susie_plot_iteration returns invisibly", { set.seed(47) dat <- simulate_regression(n = 100, p = 50, k = 3) fit <- susie(dat$X, dat$y, L = 5, track_fit = FALSE, verbose = FALSE) temp_prefix <- tempfile("test_invisible_") invisible(capture.output({ result <- suppressMessages(susie_plot_iteration(fit, L = 5, file_prefix = temp_prefix)) }, type = "output")) expect_null(result) # Clean up temp_files <- list.files(dirname(temp_prefix), pattern = basename(temp_prefix), full.names = TRUE) if (length(temp_files) > 0) file.remove(temp_files) }) # ============================================================================= # SUSIE_PLOT_CHANGEPOINT # ============================================================================= test_that("susie_plot_changepoint with basic usage works", { set.seed(23) mu <- c(rep(0, 25), rep(2, 25), rep(-1, 25), rep(1, 25)) y <- mu + rnorm(100, sd = 0.5) s <- susie_trendfilter(y, order = 0, use_mad = FALSE) expect_error( susie_plot_changepoint(s, y), NA ) }) test_that("susie_plot_changepoint with custom colors works", { 
set.seed(24) mu <- c(rep(0, 30), rep(2, 30)) y <- mu + rnorm(60, sd = 0.3) s <- susie_trendfilter(y, order = 0, use_mad = FALSE) expect_error( susie_plot_changepoint(s, y, line_col = "red", line_size = 2), NA ) }) test_that("susie_plot_changepoint with cs_col parameter works", { set.seed(25) mu <- c(rep(0, 30), rep(2, 30)) y <- mu + rnorm(60, sd = 0.3) s <- susie_trendfilter(y, order = 0, use_mad = FALSE) expect_error( susie_plot_changepoint(s, y, cs_col = "green"), NA ) }) test_that("susie_plot_changepoint with single changepoint works", { set.seed(28) mu <- c(rep(0, 30), rep(2, 30)) y <- mu + rnorm(60, sd = 0.3) s <- susie_trendfilter(y, order = 0, use_mad = FALSE) expect_error( susie_plot_changepoint(s, y), NA ) }) test_that("susie_plot_changepoint with no changepoints works", { set.seed(29) y <- rnorm(50, mean = 5, sd = 0.5) s <- susie_trendfilter(y, order = 0, use_mad = FALSE) expect_error( susie_plot_changepoint(s, y), NA ) }) test_that("susie_plot_changepoint returns ggplot object", { set.seed(30) mu <- c(rep(0, 30), rep(2, 30)) y <- mu + rnorm(60, sd = 0.3) s <- susie_trendfilter(y, order = 0, use_mad = FALSE) result <- susie_plot_changepoint(s, y) expect_s3_class(result, "gg") expect_s3_class(result, "ggplot") }) test_that("susie_plot_changepoint with multiple changepoints", { set.seed(48) # Create data with multiple clear changepoints mu <- c(rep(0, 25), rep(2, 25), rep(-1, 25), rep(1, 25)) y <- mu + rnorm(100, sd = 0.3) s <- susie_trendfilter(y, order = 0, use_mad = FALSE) result <- susie_plot_changepoint(s, y) # Verify it's a ggplot object expect_s3_class(result, "gg") # Check that CS were found cs <- susie_get_cs(s) expect_true(length(cs$cs) > 0) }) test_that("susie_plot_changepoint with very strong signal", { set.seed(49) # Very clear changepoints with low noise mu <- c(rep(0, 30), rep(5, 30)) y <- mu + rnorm(60, sd = 0.1) s <- susie_trendfilter(y, order = 0, use_mad = FALSE) result <- susie_plot_changepoint(s, y, line_col = "red", line_size = 2, 
cs_col = "blue") expect_s3_class(result, "gg") expect_s3_class(result, "ggplot") }) test_that("susie_plot_changepoint can be modified after creation", { set.seed(50) mu <- c(rep(0, 30), rep(2, 30)) y <- mu + rnorm(60, sd = 0.3) s <- susie_trendfilter(y, order = 0, use_mad = FALSE) # Use all defaults result <- susie_plot_changepoint(s, y) expect_s3_class(result, "ggplot") # Can add to the plot after creation expect_error( result + ggplot2::ggtitle("Custom Title"), NA ) }) # ============================================================================= # INTEGRATION TESTS # ============================================================================= test_that("susie_plot works with susie_ss output", { set.seed(31) dat <- simulate_regression(n = 100, p = 50, k = 3) ss <- compute_summary_stats(dat$X, dat$y) fit <- susie_ss(ss$XtX, ss$Xty, ss$yty, n = ss$n, L = 5, verbose = FALSE) expect_error( susie_plot(fit, "PIP"), NA ) }) test_that("susie_plot works with susie_rss output", { set.seed(32) n <- 200 p <- 100 X <- matrix(rnorm(n * p), n, p) beta <- rep(0, p) beta[1:3] <- 1 y <- X %*% beta + rnorm(n) ss <- univariate_regression(X, y) R <- cor(X) z <- with(ss, betahat / sebetahat) fit <- susie_rss(z, R, n = n, L = 5, verbose = FALSE) expect_error( susie_plot(fit, "PIP"), NA ) }) test_that("all three plot functions work in sequence", { set.seed(33) # Regular susie fit dat <- simulate_regression(n = 100, p = 50, k = 3) fit1 <- susie(dat$X, dat$y, L = 5, verbose = FALSE) expect_error(susie_plot(fit1, "PIP"), NA) # Trendfilter mu <- c(rep(0, 30), rep(2, 30)) y <- mu + rnorm(60, sd = 0.3) fit2 <- susie_trendfilter(y, order = 0, use_mad = FALSE) expect_error(susie_plot_changepoint(fit2, y), NA) # Iteration plot fit3 <- susie(dat$X, dat$y, L = 5, track_fit = TRUE, max_iter = 5, verbose = FALSE) temp_prefix <- tempfile("test_seq_") expect_error({ invisible(capture.output({ suppressMessages(susie_plot_iteration(fit3, L = 5, file_prefix = temp_prefix)) }, type = "output")) }, NA) # 
Clean up temp_files <- list.files(dirname(temp_prefix), pattern = basename(temp_prefix), full.names = TRUE) file.remove(temp_files) }) ================================================ FILE: tests/testthat/test_post_outcome_configuration_summary.R ================================================ # Tests for `summary.susie_post_outcome_configuration` and its print # method. The numerical algorithms (susiex / coloc_pairwise) are exercised # in mfsusieR's `tests/testthat/test_susie_post_outcome_configuration.R` # against a verbatim port of the legacy `mvf.susie.alpha::posthoc_multfsusie` # kernel; here we focus on: # * dispatch via class tag # * tidy-table shape and column names # * signal_only filtering and the kept/total bookkeeping # * defensive handling of malformed / partial input # ---- Helpers -------------------------------------------------------------- # A minimal hand-built `susiex` tuple (skips the IBSS + algorithm and # constructs the documented fields directly). make_susiex_tuple <- function(trait_names, cs_indices, marginal_prob, top_config_idx = 1L, prob_thresh = 0.8) { N <- length(trait_names) configs <- as.matrix(expand.grid(rep(list(c(0L, 1L)), N))) colnames(configs) <- paste0("trait_", seq_len(N)) cp <- numeric(2L^N) cp[top_config_idx] <- 1 list( cs_indices = setNames(as.integer(cs_indices), trait_names), logBF_trait = setNames(rep(0, N), trait_names), configs = configs, config_prob = cp, marginal_prob = setNames(marginal_prob, trait_names), active = setNames(marginal_prob >= prob_thresh, trait_names) ) } make_post_obj <- function(susiex = NULL, coloc = NULL) { out <- list() if (!is.null(susiex)) out$susiex <- susiex if (!is.null(coloc)) out$coloc_pairwise <- coloc class(out) <- c("susie_post_outcome_configuration", "list") out } make_coloc_df <- function(rows) { do.call(rbind, lapply(rows, function(r) { pp <- r$pp data.frame(trait1 = r$t1, trait2 = r$t2, l1 = r$l1, l2 = r$l2, hit1 = r$h1, hit2 = r$h2, PP.H0 = pp[1], PP.H1 = pp[2], PP.H2 = pp[3], 
PP.H3 = pp[4], PP.H4 = pp[5], stringsAsFactors = FALSE, row.names = NULL) })) } # ---- Dispatch ------------------------------------------------------------- test_that("summary() dispatches on the class tag", { obj <- make_post_obj( susiex = list(make_susiex_tuple(c("a", "b"), cs_indices = c(1, 1), marginal_prob = c(0.95, 0.95)))) s <- summary(obj, color = FALSE) expect_s3_class(s, "summary.susie_post_outcome_configuration") # Print returns input invisibly without erroring. out <- capture.output(p <- print(s)) expect_identical(p, s) # The captured output mentions the SuSiEx header. expect_true(any(grepl("SuSiEx:", out))) }) # ---- Tidy table shape ----------------------------------------------------- test_that("susiex tidy table carries one row per CS tuple with reserved + per-trait columns", { tuples <- list( make_susiex_tuple(c("trait_a", "trait_b"), cs_indices = c(1, 1), marginal_prob = c(0.95, 0.30)), make_susiex_tuple(c("trait_a", "trait_b"), cs_indices = c(2, 2), marginal_prob = c(0.10, 0.92))) s <- summary(make_post_obj(susiex = tuples), color = FALSE, signal_only = FALSE) expect_s3_class(s$susiex, "data.frame") expect_equal(nrow(s$susiex), 2L) expect_setequal(colnames(s$susiex), c("tuple", "trait_a", "trait_b", "top_pattern", "top_prob")) expect_equal(s$susiex$tuple, c("(1,1)", "(2,2)")) expect_equal(s$susiex$trait_a, c(0.95, 0.10)) }) test_that("coloc tidy table extends the input data.frame with verdict and top_pp", { rows <- list( list(t1 = "A", t2 = "B", l1 = 1, l2 = 1, h1 = "rs1", h2 = "rs1", pp = c(0.001, 0.001, 0.001, 0.05, 0.947)), list(t1 = "A", t2 = "C", l1 = 1, l2 = 1, h1 = "rs1", h2 = "rs9", pp = c(0.99, 0.005, 0.002, 0.002, 0.001))) # H0 dominant s <- summary(make_post_obj(coloc = make_coloc_df(rows)), color = FALSE, signal_only = FALSE) expect_s3_class(s$coloc_pairwise, "data.frame") expect_equal(nrow(s$coloc_pairwise), 2L) expect_true(all(c("verdict", "top_pp") %in% colnames(s$coloc_pairwise))) expect_equal(s$coloc_pairwise$verdict, c("H4 
shared", "H0 no signal")) expect_equal(s$coloc_pairwise$top_pp, c(0.947, 0.990), tolerance = 1e-9) }) # ---- signal_only filtering + bookkeeping ---------------------------------- test_that("signal_only drops below-threshold susiex rows and counts them in n_total/n_kept", { tuples <- list( make_susiex_tuple(c("a", "b"), cs_indices = c(1, 1), marginal_prob = c(0.95, 0.20)), # signal (a active) make_susiex_tuple(c("a", "b"), cs_indices = c(2, 2), marginal_prob = c(0.40, 0.30))) # no signal s_filt <- summary(make_post_obj(susiex = tuples), color = FALSE, signal_only = TRUE) s_all <- summary(make_post_obj(susiex = tuples), color = FALSE, signal_only = FALSE) expect_equal(s_filt$susiex_n_total, 2L) expect_equal(s_filt$susiex_n_kept, 1L) expect_equal(s_all$susiex_n_kept, 2L) expect_equal(s_filt$susiex$tuple, "(1,1)") }) test_that("signal_only drops H0-dominant coloc rows and footers the count", { rows <- list( list(t1 = "A", t2 = "B", l1 = 1, l2 = 1, h1 = "rs1", h2 = "rs1", pp = c(0.99, 0.005, 0.002, 0.002, 0.001)), # H0 list(t1 = "A", t2 = "B", l1 = 1, l2 = 2, h1 = "rs1", h2 = "rs7", pp = c(0.001, 0.001, 0.001, 0.05, 0.947))) # H4 obj <- make_post_obj(coloc = make_coloc_df(rows)) s <- summary(obj, color = FALSE, signal_only = TRUE) expect_equal(s$coloc_n_total, 2L) expect_equal(s$coloc_n_kept, 1L) out <- capture.output(print(s)) expect_true(any(grepl("1/2 pairs hidden", out))) }) # ---- Defensive paths ------------------------------------------------------ test_that("summary handles entirely empty input gracefully", { s <- summary(make_post_obj(), color = FALSE) expect_null(s$susiex) expect_null(s$coloc_pairwise) out <- capture.output(print(s)) expect_true(any(grepl("no signals", out))) }) test_that("summary tolerates susiex tuples with missing fields (skips them)", { good <- make_susiex_tuple(c("a", "b"), cs_indices = c(1, 1), marginal_prob = c(0.95, 0.95)) broken <- list(cs_indices = c(2, 2)) # missing marginal_prob etc. 
s <- summary(make_post_obj(susiex = list(good, broken)), color = FALSE, signal_only = FALSE) expect_equal(nrow(s$susiex), 1L) expect_equal(s$susiex_n_total, 2L) # both counted in total expect_equal(s$susiex_n_kept, 1L) }) test_that("summary prefixes trait names that collide with reserved column names", { # Trait literally named "tuple" must not clobber the CS-tuple column. tup <- make_susiex_tuple(c("tuple", "top_prob"), cs_indices = c(1, 1), marginal_prob = c(0.95, 0.95)) s <- summary(make_post_obj(susiex = list(tup)), color = FALSE) expect_true("tuple" %in% colnames(s$susiex)) # Reserved-name traits get a "trait_" prefix. expect_true("trait_tuple" %in% colnames(s$susiex)) expect_true("trait_top_prob" %in% colnames(s$susiex)) }) test_that("summary warns and skips coloc when required PP columns are missing", { bad <- data.frame(trait1 = "A", trait2 = "B", l1 = 1, l2 = 1, hit1 = "rs1", hit2 = "rs1", PP.H0 = 0.5, PP.H1 = 0.5, stringsAsFactors = FALSE) expect_warning( s <- summary(make_post_obj(coloc = bad), color = FALSE), "missing required columns") expect_null(s$coloc_pairwise) expect_equal(s$coloc_n_total, 1L) expect_equal(s$coloc_n_kept, 0L) }) test_that("summary validates its arguments", { obj <- make_post_obj() expect_error(summary(obj, prob_thresh = 1.1), "prob_thresh") expect_error(summary(obj, prob_thresh = -0.1), "prob_thresh") expect_error(summary(obj, ambiguous_lower = 0.9, prob_thresh = 0.8), "ambiguous_lower") expect_error(summary(obj, signal_only = NA), "signal_only") expect_error(summary(obj, color = "yes"), "color") }) # ---- Color toggle --------------------------------------------------------- test_that("color = FALSE produces ASCII-only output", { obj <- make_post_obj( susiex = list(make_susiex_tuple(c("a", "b"), cs_indices = c(1, 1), marginal_prob = c(0.95, 0.95)))) out <- capture.output(print(summary(obj, color = FALSE))) # No ANSI escape sequences. 
expect_false(any(grepl("\033\\[", out)))
})

test_that("color = TRUE injects ANSI escape sequences", {
  obj <- make_post_obj(
    susiex = list(make_susiex_tuple(c("a", "b"), cs_indices = c(1, 1),
                                    marginal_prob = c(0.95, 0.95))))
  out <- capture.output(print(summary(obj, color = TRUE)))
  expect_true(any(grepl("\033\\[", out)),
              info = "Forcing color = TRUE should emit at least one ANSI SGR.")
})


================================================
FILE: tests/testthat/test_refinement.R
================================================
context("Refinement unit tests")

# =============================================================================
# BASIC FUNCTIONALITY
# =============================================================================

test_that("run_refine returns a valid susie model", {
  setup <- create_model_with_cs(seed = 100)
  skip_if(is.null(setup$model$sets) || length(setup$model$sets$cs) == 0,
          "No credible sets found in initial model")
  refined_model <- run_refine(setup$model, setup$data, setup$params)
  # The refined object should keep the standard susie fit components.
  expect_true("alpha" %in% names(refined_model))
  expect_true("mu" %in% names(refined_model))
  expect_true("V" %in% names(refined_model))
  expect_true("sigma2" %in% names(refined_model))
  expect_true("elbo" %in% names(refined_model))
})

test_that("run_refine maintains or improves ELBO", {
  setup <- create_model_with_cs(seed = 101)
  skip_if(is.null(setup$model$sets) || length(setup$model$sets$cs) == 0,
          "No credible sets found in initial model")
  initial_elbo <- susie_get_objective(setup$model)
  refined_model <- run_refine(setup$model, setup$data, setup$params)
  final_elbo <- susie_get_objective(refined_model)
  expect_true(final_elbo >= initial_elbo - 1e-6)
})

test_that("run_refine preserves model dimensions", {
  setup <- create_model_with_cs(seed = 102)
  skip_if(is.null(setup$model$sets) || length(setup$model$sets$cs) == 0,
          "No credible sets found in initial model")
  initial_L <- nrow(setup$model$alpha)
  initial_p <- ncol(setup$model$alpha)
  refined_model <- run_refine(setup$model, setup$data, setup$params)
  expect_equal(nrow(refined_model$alpha), initial_L)
  expect_equal(ncol(refined_model$alpha), initial_p)
  expect_equal(nrow(refined_model$mu), initial_L)
  expect_equal(ncol(refined_model$mu), initial_p)
})

test_that("run_refine returns finite ELBO", {
  setup <- create_model_with_cs(seed = 103)
  skip_if(is.null(setup$model$sets) || length(setup$model$sets$cs) == 0,
          "No credible sets found in initial model")
  refined_model <- run_refine(setup$model, setup$data, setup$params)
  expect_true(all(is.finite(refined_model$elbo)))
  expect_true(is.finite(susie_get_objective(refined_model)))
})

test_that("run_refine maintains valid probability distributions", {
  setup <- create_model_with_cs(seed = 104)
  skip_if(is.null(setup$model$sets) || length(setup$model$sets$cs) == 0,
          "No credible sets found in initial model")
  refined_model <- run_refine(setup$model, setup$data, setup$params)
  # Each row of alpha is a posterior inclusion distribution: in [0,1], sums to 1.
  expect_true(all(refined_model$alpha >= 0))
  expect_true(all(refined_model$alpha <= 1))
  row_sums <- rowSums(refined_model$alpha)
  expect_true(all(abs(row_sums - 1) < 1e-10))
})

# =============================================================================
# REFINEMENT LOGIC
# =============================================================================

test_that("run_refine iterates through credible sets", {
  setup <- create_model_with_cs(n = 200, p = 100, L = 10, n_causal = 3, seed = 105)
  skip_if(is.null(setup$model$sets) || length(setup$model$sets$cs) == 0,
          "No credible sets found in initial model")
  n_cs_initial <- length(setup$model$sets$cs)
  refined_model <- run_refine(setup$model, setup$data, setup$params)
  expect_true(is.finite(susie_get_objective(refined_model)))
})

test_that("run_refine uses two-step procedure correctly", {
  setup <- create_model_with_cs(seed = 106)
  skip_if(is.null(setup$model$sets) || length(setup$model$sets$cs) == 0,
          "No credible sets found in initial model")
  refined_model <- run_refine(setup$model, setup$data, setup$params)
  expect_true("alpha" %in% names(refined_model))
  expect_true(all(refined_model$alpha >= 0 & refined_model$alpha <= 1))
})

test_that("run_refine preserves prior weights structure", {
  setup <- create_model_with_cs(seed = 107)
  skip_if(is.null(setup$model$sets) || length(setup$model$sets$cs) == 0,
          "No credible sets found in initial model")
  initial_pi <- setup$model$pi
  refined_model <- run_refine(setup$model, setup$data, setup$params)
  # Prior weights stay a valid probability vector of unchanged length.
  expect_equal(length(refined_model$pi), length(initial_pi))
  expect_true(all(refined_model$pi >= 0))
  expect_true(abs(sum(refined_model$pi) - 1) < 1e-10)
})

test_that("run_refine evaluates multiple candidate models", {
  setup <- create_model_with_cs(n = 200, p = 100, L = 10, n_causal = 4, seed = 108)
  skip_if(is.null(setup$model$sets) || length(setup$model$sets$cs) < 2,
          "Need at least 2 credible sets")
  refined_model <- run_refine(setup$model, setup$data, setup$params)
  expect_true(is.finite(susie_get_objective(refined_model)))
})

# =============================================================================
# CONVERGENCE BEHAVIOR
# =============================================================================

test_that("run_refine stops when ELBO improvement < tol", {
  setup <- create_model_with_cs(seed = 109)
  skip_if(is.null(setup$model$sets) || length(setup$model$sets$cs) == 0,
          "No credible sets found in initial model")
  params_tight_tol <- setup$params
  params_tight_tol$tol <- 1e-10
  refined_model <- run_refine(setup$model, setup$data, params_tight_tol)
  expect_true(is.finite(susie_get_objective(refined_model)))
})

test_that("run_refine with loose tolerance may iterate more", {
  setup <- create_model_with_cs(seed = 110)
  skip_if(is.null(setup$model$sets) || length(setup$model$sets$cs) == 0,
          "No credible sets found in initial model")
  params_loose <- setup$params
  params_loose$tol <- 1e-1
  refined_model <- run_refine(setup$model, setup$data, params_loose)
  expect_true(is.finite(susie_get_objective(refined_model)))
})

test_that("run_refine stops when no candidate models generated", {
  setup <- create_model_with_cs(seed = 111)
  skip_if(is.null(setup$model$sets) || length(setup$model$sets$cs) == 0,
          "No credible sets found in initial model")
  refined_model <- run_refine(setup$model, setup$data, setup$params)
  expect_true("elbo" %in% names(refined_model))
})

test_that("run_refine convergence is deterministic", {
  setup <- create_model_with_cs(seed = 112)
  skip_if(is.null(setup$model$sets) || length(setup$model$sets$cs) == 0,
          "No credible sets found in initial model")
  # Two runs on identical inputs must reach the same objective.
  refined1 <- run_refine(setup$model, setup$data, setup$params)
  refined2 <- run_refine(setup$model, setup$data, setup$params)
  expect_equal(susie_get_objective(refined1), susie_get_objective(refined2))
})

# =============================================================================
# EDGE CASES
# =============================================================================

test_that("run_refine handles model with no credible sets", {
  set.seed(113)
  n <- 100
  p <- 50
  # Pure-noise outcome so the fit is expected to find no credible sets.
  X <- matrix(rnorm(n * p), n, p)
  y <- rnorm(n)
  model <- susie(X, y, L = 5, verbose = FALSE)
  constructor_result <- individual_data_constructor(
    X = X, y = y, L = 5, standardize = TRUE, intercept = TRUE,
    estimate_residual_method = "MLE", convergence_method = "elbo",
    coverage = 0.95, min_abs_corr = 0.5, n_purity = 100, track_fit = FALSE
  )
  if (is.null(model$sets) || length(model$sets$cs) == 0) {
    # With nothing to refine, the objective should be unchanged.
    refined_model <- run_refine(model, constructor_result$data,
                                constructor_result$params)
    expect_equal(susie_get_objective(refined_model), susie_get_objective(model))
  } else {
    skip("Model unexpectedly found credible sets")
  }
})

test_that("run_refine handles single credible set", {
  setup <- create_model_with_cs(n = 200, p = 100, L = 10, n_causal = 1, seed = 114)
  skip_if(is.null(setup$model$sets) || length(setup$model$sets$cs) == 0,
          "No credible sets found")
  refined_model <- run_refine(setup$model, setup$data, setup$params)
  expect_true(is.finite(susie_get_objective(refined_model)))
  expect_true(susie_get_objective(refined_model) >=
                susie_get_objective(setup$model) - 1e-6)
})

test_that("run_refine handles credible set with all prior weights zero", {
  setup <- create_model_with_cs(seed = 115)
  skip_if(is.null(setup$model$sets) || length(setup$model$sets$cs) == 0,
          "No credible sets found")
  if (length(setup$model$sets$cs) > 0) {
    cs_vars <- setup$model$sets$cs[[1]]
    if (length(cs_vars) < ncol(setup$model$alpha)) {
      refined_model <- run_refine(setup$model, setup$data, setup$params)
      expect_true(is.finite(susie_get_objective(refined_model)))
    }
  }
})

test_that("run_refine handles large credible set", {
  setup <- create_model_with_cs(n = 200, p = 100, seed = 116)
  skip_if(is.null(setup$model$sets) || length(setup$model$sets$cs) == 0,
          "No credible sets found")
  refined_model <- run_refine(setup$model, setup$data, setup$params)
  expect_true(is.finite(susie_get_objective(refined_model)))
})

test_that("run_refine handles small p relative to L", {
  setup <- create_model_with_cs(n = 100, p = 10, L = 5, n_causal = 2, seed = 117)
  skip_if(is.null(setup$model$sets) || length(setup$model$sets$cs) == 0,
          "No credible sets found")
  refined_model <- run_refine(setup$model, setup$data, setup$params)
  expect_true(is.finite(susie_get_objective(refined_model)))
})

# =============================================================================
# PARAMETER HANDLING
# =============================================================================

test_that("run_refine respects verbose parameter", {
  setup <- create_model_with_cs(seed = 118)
  skip_if(is.null(setup$model$sets) || length(setup$model$sets$cs) == 0,
          "No credible sets found")
  params_verbose <- setup$params
  params_verbose$verbose <- TRUE
  expect_message(
    run_refine(setup$model, setup$data, params_verbose),
    "Block ascent iter"
  )
})

test_that("run_refine verbose=FALSE produces no output", {
  setup <- create_model_with_cs(seed = 119)
  skip_if(is.null(setup$model$sets) || length(setup$model$sets$cs) == 0,
          "No credible sets found")
  params_silent <- setup$params
  params_silent$verbose <- FALSE
  expect_silent(
    run_refine(setup$model, setup$data, params_silent)
  )
})

test_that("run_refine warns about model_init", {
  setup <- create_model_with_cs(seed = 120)
  skip_if(is.null(setup$model$sets) || length(setup$model$sets$cs) == 0,
          "No credible sets found")
  params_with_init <- setup$params
  params_with_init$model_init <- list(alpha = setup$model$alpha)
  expect_message(
    run_refine(setup$model, setup$data, params_with_init),
    "model_init is not used"
  )
})

test_that("run_refine respects tolerance parameter", {
  setup <- create_model_with_cs(seed = 121)
  skip_if(is.null(setup$model$sets) || length(setup$model$sets$cs) == 0,
          "No credible sets found")
  params_tol1 <- setup$params
  params_tol1$tol <- 1e-2
  params_tol2 <- setup$params
  params_tol2$tol <- 1e-6
  refined1 <- run_refine(setup$model, setup$data, params_tol1)
  refined2 <- run_refine(setup$model, setup$data, params_tol2)
  expect_true(is.finite(susie_get_objective(refined1)))
  expect_true(is.finite(susie_get_objective(refined2)))
})

test_that("run_refine preserves null_weight", {
  setup <- create_model_with_cs(seed = 122)
  skip_if(is.null(setup$model$sets) || length(setup$model$sets$cs) == 0,
          "No credible sets found")
  initial_null_weight <- setup$model$null_weight
  refined_model <- run_refine(setup$model, setup$data, setup$params)
  expect_equal(refined_model$null_weight, initial_null_weight)
})

# =============================================================================
# INTEGRATION
# =============================================================================

test_that("run_refine works with individual data", {
  setup <- create_model_with_cs(seed = 123)
  skip_if(is.null(setup$model$sets) || length(setup$model$sets$cs) == 0,
          "No credible sets found")
  expect_equal(class(setup$data), "individual")
  refined_model <- run_refine(setup$model, setup$data, setup$params)
  expect_true(is.finite(susie_get_objective(refined_model)))
})

test_that("run_refine works with sufficient statistics", {
  set.seed(124)
  n <- 100
  p <- 50
  X <- matrix(rnorm(n * p), n, p)
  X <- scale(X)
  beta <- rep(0, p)
  beta[c(5, 15, 25)] <- c(1.5, -1.2, 1.0)
  y <- as.vector(X %*% beta + rnorm(n, sd = 0.5))
  # Sufficient statistics for the regression: X'X, X'y, y'y.
  XtX <- crossprod(X)
  Xty <- as.vector(crossprod(X, y))
  yty <- sum(y^2)
  model <- susie_ss(XtX, Xty, yty, n = n, L = 5, verbose = FALSE)
  skip_if(is.null(model$sets) || length(model$sets$cs) == 0,
          "No credible sets found")
  constructor_result <- sufficient_stats_constructor(
    XtX = XtX, Xty = Xty, yty = yty, n = n, L = 5, standardize = TRUE,
    estimate_residual_method = "MLE", convergence_method = "elbo",
    coverage = 0.95, min_abs_corr = 0.5, n_purity = 100, track_fit = FALSE
  )
  refined_model <- run_refine(model, constructor_result$data,
                              constructor_result$params)
  expect_true(is.finite(susie_get_objective(refined_model)))
})

test_that("run_refine output compatible with susie_get functions", {
  setup <- create_model_with_cs(seed = 125)
  skip_if(is.null(setup$model$sets) || length(setup$model$sets$cs) == 0,
          "No credible sets found")
  refined_model <- run_refine(setup$model, setup$data, setup$params)
  pips <- susie_get_pip(refined_model)
  expect_equal(length(pips), ncol(refined_model$alpha))
  expect_true(all(pips >= 0))
  expect_true(all(pips <= 1))
  cs <- susie_get_cs(refined_model)
  expect_true(is.null(cs) || is.list(cs))
  post_mean <- susie_get_posterior_mean(refined_model)
  expect_true(all(is.finite(post_mean)))
})

test_that("run_refine maintains fitted values", {
  setup <- create_model_with_cs(seed = 126)
  skip_if(is.null(setup$model$sets) || length(setup$model$sets$cs) == 0,
          "No credible sets found")
  refined_model <- run_refine(setup$model, setup$data, setup$params)
  expect_true("fitted" %in% names(refined_model))
  expect_equal(length(refined_model$fitted), nrow(setup$X))
  expect_true(all(is.finite(refined_model$fitted)))
})

test_that("run_refine maintains intercept", {
  setup <- create_model_with_cs(seed = 127)
  skip_if(is.null(setup$model$sets) || length(setup$model$sets$cs) == 0,
          "No credible sets found")
  refined_model <- run_refine(setup$model, setup$data, setup$params)
  expect_true("intercept" %in% names(refined_model))
  expect_true(is.finite(refined_model$intercept))
})

# =============================================================================
# MATHEMATICAL PROPERTIES
# =============================================================================

test_that("run_refine maintains non-negative prior variances", {
  setup <- create_model_with_cs(seed = 128)
  skip_if(is.null(setup$model$sets) || length(setup$model$sets$cs) == 0,
          "No credible sets found")
  refined_model <- run_refine(setup$model, setup$data, setup$params)
  expect_true(all(refined_model$V >= 0))
  expect_true(all(is.finite(refined_model$V)))
})

test_that("run_refine maintains positive residual variance", {
  setup <- create_model_with_cs(seed = 129)
  skip_if(is.null(setup$model$sets) || length(setup$model$sets$cs) == 0,
          "No credible sets found")
  refined_model <- run_refine(setup$model, setup$data, setup$params)
  expect_true(refined_model$sigma2 > 0)
  expect_true(is.finite(refined_model$sigma2))
})

test_that("run_refine maintains non-negative KL divergences", {
  setup <- create_model_with_cs(seed = 130)
  skip_if(is.null(setup$model$sets) || length(setup$model$sets$cs) == 0,
          "No credible sets found")
  refined_model <- run_refine(setup$model, setup$data, setup$params)
  # Small negative slack tolerates floating-point error.
  expect_true(all(refined_model$KL >= -1e-6))
})

test_that("run_refine ELBO is monotonically increasing", {
  setup <- create_model_with_cs(seed = 131)
  skip_if(is.null(setup$model$sets) || length(setup$model$sets$cs) == 0,
          "No credible sets found")
  refined_model <- run_refine(setup$model, setup$data, setup$params)
  elbo_diff <- diff(refined_model$elbo)
  expect_true(all(elbo_diff > -1e-6))
})

# =============================================================================
# SIGNAL RECOVERY
# =============================================================================

test_that("run_refine improves or maintains signal recovery", {
  setup <- create_model_with_cs(n = 200, p = 100, L = 10, n_causal = 3, seed = 132)
  skip_if(is.null(setup$model$sets) || length(setup$model$sets$cs) == 0,
          "No credible sets found")
  pips_initial <- susie_get_pip(setup$model)
  refined_model <- run_refine(setup$model, setup$data, setup$params)
  pips_refined <- susie_get_pip(refined_model)
  expect_equal(length(pips_refined), length(pips_initial))
  expect_true(all(pips_refined >= 0))
  expect_true(all(pips_refined <= 1))
})

test_that("run_refine identifies true causal variables", {
  setup <- create_model_with_cs(n = 200, p = 100, L = 10, n_causal = 3, seed = 133)
  skip_if(is.null(setup$model$sets) || length(setup$model$sets$cs) == 0,
          "No credible sets found")
  refined_model <- run_refine(setup$model, setup$data, setup$params)
  pips <- susie_get_pip(refined_model)
  # At least one true causal variable should rank in the top five PIPs.
  top_vars <- order(pips, decreasing = TRUE)[1:5]
  overlap <- length(intersect(top_vars, setup$causal_idx))
  expect_true(overlap >= 1)
})

test_that("run_refine maintains low PIPs for null variables", {
  setup <- create_model_with_cs(n = 200, p = 100, L = 10, n_causal = 3, seed = 134)
  skip_if(is.null(setup$model$sets) || length(setup$model$sets$cs) == 0,
          "No credible sets found")
  refined_model <- run_refine(setup$model, setup$data, setup$params)
  pips <- susie_get_pip(refined_model)
  null_vars <- setdiff(1:length(pips), setup$causal_idx)
  null_pips <- pips[null_vars]
  expect_true(median(null_pips) < 0.3)
})

# =============================================================================
# COMPARISON
# =============================================================================

test_that("run_refine produces different result than no refinement", {
  setup <- create_model_with_cs(n = 200, p = 100, L = 10, n_causal = 3, seed = 135)
  skip_if(is.null(setup$model$sets) || length(setup$model$sets$cs) == 0,
          "No credible sets found")
  initial_elbo <- susie_get_objective(setup$model)
  refined_model <- run_refine(setup$model, setup$data, setup$params)
  refined_elbo <- susie_get_objective(refined_model)
  # Either refinement improved the ELBO beyond tol, or it left it unchanged
  # within tolerance.
  if (refined_elbo > initial_elbo + setup$params$tol) {
    expect_true(TRUE)
  } else {
    expect_equal(refined_elbo, initial_elbo, tolerance = setup$params$tol)
  }
})

test_that("run_refine with tight tolerance may differ from loose tolerance", {
  setup <- create_model_with_cs(seed = 136)
  skip_if(is.null(setup$model$sets) || length(setup$model$sets$cs) == 0,
          "No credible sets found")
  params_tight <- setup$params
  params_tight$tol <- 1e-6
  params_loose <- setup$params
  params_loose$tol <- 1e-1
  refined_tight <- run_refine(setup$model, setup$data, params_tight)
  refined_loose <- run_refine(setup$model, setup$data, params_loose)
  expect_true(is.finite(susie_get_objective(refined_tight)))
  expect_true(is.finite(susie_get_objective(refined_loose)))
})

# =============================================================================
# STRESS TESTING
# =============================================================================

test_that("run_refine handles multiple refinement iterations", {
  setup <- create_model_with_cs(n = 200, p = 100, L = 10, n_causal = 5, seed = 137)
  skip_if(is.null(setup$model$sets) || length(setup$model$sets$cs) < 2,
          "Need multiple credible sets")
  params_loose <- setup$params
  params_loose$tol <- 1e-3
  refined_model <- run_refine(setup$model, setup$data, params_loose)
  expect_true(is.finite(susie_get_objective(refined_model)))
  expect_true(susie_get_objective(refined_model) >=
                susie_get_objective(setup$model) - 1e-6)
})

test_that("run_refine handles large L", {
  setup <- create_model_with_cs(n = 150, p = 80, L = 20, n_causal = 4, seed = 138)
  skip_if(is.null(setup$model$sets) || length(setup$model$sets$cs) == 0,
          "No credible sets found")
  refined_model <- run_refine(setup$model, setup$data, setup$params)
  expect_equal(nrow(refined_model$alpha), nrow(setup$model$alpha))
  expect_true(is.finite(susie_get_objective(refined_model)))
})

test_that("run_refine handles large p", {
  setup <- create_model_with_cs(n = 150, p = 200, L = 10, n_causal = 3, seed = 139)
  skip_if(is.null(setup$model$sets) || length(setup$model$sets$cs) == 0,
          "No credible sets found")
  refined_model <- run_refine(setup$model, setup$data, setup$params)
  expect_equal(ncol(refined_model$alpha), ncol(setup$model$alpha))
  expect_true(is.finite(susie_get_objective(refined_model)))
})


================================================
FILE: tests/testthat/test_rss_lambda_methods.R
================================================
context("S3 methods for rss_lambda data class")

# =============================================================================
# DATA INITIALIZATION & CONFIGURATION
# =============================================================================

test_that("configure_data.rss_lambda returns configured data object", {
  dat <- setup_rss_lambda_data(seed = 1)
  # Create rss_lambda data object
  result <- rss_lambda_constructor(
    z = dat$z, R = dat$R, lambda = dat$lambda, n = dat$n
  )
  data <- result$data
  params <- list(
    L = 5, prior_variance = 0.2, residual_variance = 1.0
  )
  configured <- configure_data.rss_lambda(data, params)
  expect_s3_class(configured, "rss_lambda")
  expect_true(!is.null(configured$z))
  expect_true(!is.null(configured$R))
  expect_equal(configured$lambda, dat$lambda)
})

test_that("get_var_y.rss_lambda returns 1", {
  dat <- setup_rss_lambda_data(seed = 2)
  result <- rss_lambda_constructor(
    z = dat$z, R = dat$R, lambda = dat$lambda, n = dat$n
  )
  data <- result$data
  var_y <- get_var_y.rss_lambda(data)
  expect_equal(var_y, 1)
  expect_type(var_y, "double")
  expect_length(var_y, 1)
})

# =============================================================================
# MODEL INITIALIZATION & SETUP
# =============================================================================

test_that("initialize_susie_model.rss_lambda creates valid model", {
  dat <- setup_rss_lambda_data(seed = 3)
  result <- rss_lambda_constructor(
    z = dat$z, R = dat$R, lambda = dat$lambda, n = dat$n
  )
  data <- result$data
  params <- list(
    L = 5, prior_variance = 0.2, residual_variance = 1.0,
    estimate_residual_variance =
TRUE, estimate_prior_variance = TRUE ) var_y <- get_var_y.rss_lambda(data) model <- initialize_susie_model.rss_lambda(data, params, var_y) expect_type(model, "list") expect_true(!is.null(model$alpha)) expect_true(!is.null(model$mu)) expect_true(!is.null(model$mu2)) expect_true(!is.null(model$SinvRj)) expect_true(!is.null(model$RjSinvRj)) # Check dimensions expect_equal(dim(model$alpha), c(5, dat$p)) expect_equal(dim(model$mu), c(5, dat$p)) expect_equal(dim(model$SinvRj), c(dat$p, dat$p)) expect_length(model$RjSinvRj, dat$p) }) test_that("validate_prior.rss_lambda delegates to default method", { dat <- setup_rss_lambda_data(seed = 21) result <- rss_lambda_constructor( z = dat$z, R = dat$R, lambda = dat$lambda, n = dat$n ) data <- result$data params <- list( L = 5, prior_variance = 0.2, residual_variance = 1.0 ) var_y <- get_var_y.rss_lambda(data) model <- initialize_susie_model.rss_lambda(data, params, var_y) result <- validate_prior.rss_lambda(data, params, model) expect_type(result, "logical") }) test_that("track_ibss_fit.rss_lambda delegates to default method", { dat <- setup_rss_lambda_data(seed = 22) result <- rss_lambda_constructor( z = dat$z, R = dat$R, lambda = dat$lambda, n = dat$n ) data <- result$data params <- list(L = 5, track_fit = TRUE, scaled_prior_variance = 0.2, residual_variance = 1.0, prior_weights = rep(1/dat$p, dat$p)) var_y <- get_var_y.rss_lambda(data) model <- initialize_susie_model.rss_lambda(data, params, var_y) tracking <- list() iter <- 1 elbo <- -100 result <- track_ibss_fit.rss_lambda(data, params, model, tracking, iter, elbo) expect_type(result, "list") }) # ============================================================================= # SINGLE EFFECT REGRESSION & ELBO # ============================================================================= test_that("initialize_fitted.rss_lambda creates Rz", { dat <- setup_rss_lambda_data(seed = 4) result <- rss_lambda_constructor( z = dat$z, R = dat$R, lambda = dat$lambda, n = dat$n ) data <- 
result$data # Create minimal mat_init mat_init <- list( alpha = matrix(1/dat$p, nrow = 5, ncol = dat$p), mu = matrix(0, nrow = 5, ncol = dat$p) ) fitted <- initialize_fitted.rss_lambda(data, mat_init) expect_type(fitted, "list") expect_true("Rz" %in% names(fitted)) expect_length(fitted$Rz, dat$p) expect_type(fitted$Rz, "double") }) test_that("compute_residuals.rss_lambda computes correct residuals", { dat <- setup_rss_lambda_data(seed = 5) result <- rss_lambda_constructor( z = dat$z, R = dat$R, lambda = dat$lambda, n = dat$n ) data <- result$data params <- list(L = 5, scaled_prior_variance = 0.2, residual_variance = 1.0) var_y <- get_var_y.rss_lambda(data) model <- initialize_susie_model.rss_lambda(data, params, var_y) # Add Rz to model model$Rz <- as.vector(data$R %*% colSums(model$alpha * model$mu)) # Compute residuals for effect 1 model <- compute_residuals.rss_lambda(data, params, model, l = 1) expect_true("residuals" %in% names(model)) expect_true("fitted_without_l" %in% names(model)) expect_length(model$residuals, dat$p) expect_length(model$fitted_without_l, dat$p) expect_equal(model$residual_variance, 1) }) test_that("compute_ser_statistics.rss_lambda computes shat2 and optim params", { dat <- setup_rss_lambda_data(seed = 6) result <- rss_lambda_constructor( z = dat$z, R = dat$R, lambda = dat$lambda, n = dat$n ) data <- result$data params <- list(L = 5, scaled_prior_variance = 0.2, residual_variance = 1.0) var_y <- get_var_y.rss_lambda(data) model <- initialize_susie_model.rss_lambda(data, params, var_y) model$Rz <- as.vector(data$R %*% colSums(model$alpha * model$mu)) model <- compute_residuals.rss_lambda(data, params, model, l = 1) ser_stats <- compute_ser_statistics.rss_lambda(data, params, model, l = 1) expect_type(ser_stats, "list") expect_true("shat2" %in% names(ser_stats)) expect_true("optim_init" %in% names(ser_stats)) expect_true("optim_bounds" %in% names(ser_stats)) expect_true("optim_scale" %in% names(ser_stats)) expect_length(ser_stats$shat2, 
dat$p) expect_true(all(ser_stats$shat2 > 0)) expect_equal(ser_stats$optim_scale, "log") }) test_that("SER_posterior_e_loglik.rss_lambda computes expected log-likelihood", { dat <- setup_rss_lambda_data(seed = 7) result <- rss_lambda_constructor( z = dat$z, R = dat$R, lambda = dat$lambda, n = dat$n ) data <- result$data params <- list(L = 5, scaled_prior_variance = 0.2, residual_variance = 1.0) var_y <- get_var_y.rss_lambda(data) model <- initialize_susie_model.rss_lambda(data, params, var_y) model$Rz <- as.vector(data$R %*% colSums(model$alpha * model$mu)) model <- compute_residuals.rss_lambda(data, params, model, l = 1) e_loglik <- SER_posterior_e_loglik.rss_lambda(data, params, model, l = 1) expect_type(e_loglik, "double") expect_length(e_loglik, 1) expect_true(is.finite(e_loglik)) }) test_that("compute_kl.rss_lambda delegates to default method", { dat <- setup_rss_lambda_data(seed = 23) result <- rss_lambda_constructor( z = dat$z, R = dat$R, lambda = dat$lambda, n = dat$n ) data <- result$data params <- list(L = 5, scaled_prior_variance = 0.2, residual_variance = 1.0) var_y <- get_var_y.rss_lambda(data) model <- initialize_susie_model.rss_lambda(data, params, var_y) model$Rz <- as.vector(data$R %*% colSums(model$alpha * model$mu)) # Set up for KL computation l <- 1 model$lbf <- rep(0, params$L) model$alpha[l, ] <- rep(1/dat$p, dat$p) model$mu[l, ] <- rnorm(dat$p, sd = 0.1) model$mu2[l, ] <- model$mu[l, ]^2 + 0.1 model <- compute_residuals.rss_lambda(data, params, model, l) model <- compute_kl.rss_lambda(data, params, model, l) expect_type(model$KL[l], "double") expect_length(model$KL[l], 1) }) test_that("calculate_posterior_moments.rss_lambda computes moments", { dat <- setup_rss_lambda_data(seed = 8) result <- rss_lambda_constructor( z = dat$z, R = dat$R, lambda = dat$lambda, n = dat$n ) data <- result$data params <- list(L = 5, scaled_prior_variance = 0.2, residual_variance = 1.0) var_y <- get_var_y.rss_lambda(data) model <- 
initialize_susie_model.rss_lambda(data, params, var_y) model$Rz <- as.vector(data$R %*% colSums(model$alpha * model$mu)) model <- compute_residuals.rss_lambda(data, params, model, l = 1) V <- 0.2 l <- 1 model <- calculate_posterior_moments.rss_lambda(data, params, model, V, l) expect_length(model$mu[l, ], dat$p) expect_length(model$mu2[l, ], dat$p) # Variance should be positive post_var <- model$mu2[l, ] - model$mu[l, ]^2 expect_true(all(post_var > -1e-10)) # post_mean2 = post_var + post_mean^2 expect_equal(model$mu2[l, ], post_var + model$mu[l, ]^2) }) test_that("Eloglik.rss_lambda computes expected log-likelihood", { dat <- setup_rss_lambda_data(seed = 24) result <- rss_lambda_constructor( z = dat$z, R = dat$R, lambda = dat$lambda, n = dat$n ) data <- result$data params <- list(L = 5, scaled_prior_variance = 0.2, residual_variance = 1.0) var_y <- get_var_y.rss_lambda(data) model <- initialize_susie_model.rss_lambda(data, params, var_y) # Precompute cached terms needed for Eloglik model <- precompute_rss_lambda_terms(data, model) e_loglik <- Eloglik.rss_lambda(data, model) expect_type(e_loglik, "double") expect_length(e_loglik, 1) expect_true(is.finite(e_loglik)) }) test_that("loglik.rss_lambda computes log Bayes factors", { dat <- setup_rss_lambda_data(seed = 25) result <- rss_lambda_constructor( z = dat$z, R = dat$R, lambda = dat$lambda, n = dat$n ) data <- result$data params <- list(L = 5, scaled_prior_variance = 0.2, residual_variance = 1.0, prior_weights = rep(1/dat$p, dat$p)) var_y <- get_var_y.rss_lambda(data) model <- initialize_susie_model.rss_lambda(data, params, var_y) model$Rz <- as.vector(data$R %*% colSums(model$alpha * model$mu)) model <- compute_residuals.rss_lambda(data, params, model, l = 1) V <- 0.2 l <- 1 ser_stats <- compute_ser_statistics.rss_lambda(data, params, model, l = l) model <- loglik.rss_lambda(data, params, model, V, ser_stats, l) expect_length(model$lbf_variable[l, ], dat$p) expect_length(model$alpha[l, ], dat$p) 
expect_true(all(model$alpha[l, ] >= 0)) expect_true(abs(sum(model$alpha[l, ]) - 1) < 1e-10) expect_true(is.numeric(model$lbf[l])) }) test_that("neg_loglik.rss_lambda returns negative log-likelihood", { dat <- setup_rss_lambda_data(seed = 26) result <- rss_lambda_constructor( z = dat$z, R = dat$R, lambda = dat$lambda, n = dat$n ) data <- result$data params <- list(L = 5, scaled_prior_variance = 0.2, residual_variance = 1.0, prior_weights = rep(1/dat$p, dat$p)) var_y <- get_var_y.rss_lambda(data) model <- initialize_susie_model.rss_lambda(data, params, var_y) model$Rz <- as.vector(data$R %*% colSums(model$alpha * model$mu)) model <- compute_residuals.rss_lambda(data, params, model, l = 1) V_param <- log(1.0) # Log scale ser_stats <- compute_ser_statistics.rss_lambda(data, params, model, l = 1) neg_ll <- neg_loglik.rss_lambda(data, params, model, V_param, ser_stats) expect_type(neg_ll, "double") expect_length(neg_ll, 1) }) test_that("get_ER2.rss_lambda computes expected squared residuals", { dat <- setup_rss_lambda_data(seed = 27) result <- rss_lambda_constructor( z = dat$z, R = dat$R, lambda = dat$lambda, n = dat$n ) data <- result$data params <- list(L = 5, scaled_prior_variance = 0.2, residual_variance = 1.0) var_y <- get_var_y.rss_lambda(data) model <- initialize_susie_model.rss_lambda(data, params, var_y) # Precompute cached terms needed for get_ER2 model <- precompute_rss_lambda_terms(data, model) er2 <- get_ER2.rss_lambda(data, model) expect_type(er2, "double") expect_length(er2, 1) expect_true(er2 >= 0) expect_true(is.finite(er2)) }) # ============================================================================= # MODEL UPDATES & FITTING # ============================================================================= test_that("update_fitted_values.rss_lambda updates Rz correctly", { dat <- setup_rss_lambda_data(seed = 28) result <- rss_lambda_constructor( z = dat$z, R = dat$R, lambda = dat$lambda, n = dat$n ) data <- result$data params <- list(L = 5, 
scaled_prior_variance = 0.2, residual_variance = 1.0) var_y <- get_var_y.rss_lambda(data) model <- initialize_susie_model.rss_lambda(data, params, var_y) model$Rz <- as.vector(data$R %*% colSums(model$alpha * model$mu)) model <- compute_residuals.rss_lambda(data, params, model, l = 1) # Update fitted values for effect 1 old_Rz <- model$Rz model <- update_fitted_values.rss_lambda(data, params, model, l = 1) expect_true("Rz" %in% names(model)) expect_length(model$Rz, dat$p) expect_type(model$Rz, "double") }) test_that("update_variance_components.rss_lambda estimates sigma2", { dat <- setup_rss_lambda_data(seed = 29) result <- rss_lambda_constructor( z = dat$z, R = dat$R, lambda = dat$lambda, n = dat$n ) data <- result$data params <- list(L = 5, scaled_prior_variance = 0.2, residual_variance = 1.0, estimate_residual_variance = TRUE) var_y <- get_var_y.rss_lambda(data) model <- initialize_susie_model.rss_lambda(data, params, var_y) # Precompute cached terms model <- precompute_rss_lambda_terms(data, model) variance_update <- update_variance_components.rss_lambda(data, params, model) expect_type(variance_update, "list") expect_true("sigma2" %in% names(variance_update)) expect_type(variance_update$sigma2, "double") expect_length(variance_update$sigma2, 1) expect_true(variance_update$sigma2 > 0) expect_true(variance_update$sigma2 <= 1 - dat$lambda) # Upper bound }) test_that("update_derived_quantities.rss_lambda updates SinvRj and RjSinvRj", { dat <- setup_rss_lambda_data(seed = 12) result <- rss_lambda_constructor( z = dat$z, R = dat$R, lambda = dat$lambda, n = dat$n ) data <- result$data params <- list(L = 5, scaled_prior_variance = 0.2, residual_variance = 1.0) var_y <- get_var_y.rss_lambda(data) model <- initialize_susie_model.rss_lambda(data, params, var_y) # Change sigma2 model$sigma2 <- 0.5 # Update derived quantities updated_model <- update_derived_quantities.rss_lambda(data, params, model) expect_true("SinvRj" %in% names(updated_model)) expect_true("RjSinvRj" 
%in% names(updated_model))
  expect_equal(dim(updated_model$SinvRj), c(dat$p, dat$p))
  expect_length(updated_model$RjSinvRj, dat$p)
})

# =============================================================================
# OUTPUT GENERATION & POST-PROCESSING
# =============================================================================

test_that("get_scale_factors.rss_lambda returns vector of 1s", {
  dat <- setup_rss_lambda_data(seed = 13)
  result <- rss_lambda_constructor(z = dat$z, R = dat$R,
                                   lambda = dat$lambda, n = dat$n)
  data <- result$data
  params <- list()
  scale_factors <- get_scale_factors.rss_lambda(data, params)
  expect_type(scale_factors, "double")
  expect_length(scale_factors, dat$p)
  expect_equal(scale_factors, rep(1, dat$p))
})

test_that("get_intercept.rss_lambda returns intercept_value", {
  dat <- setup_rss_lambda_data(seed = 14)
  result <- rss_lambda_constructor(z = dat$z, R = dat$R,
                                   lambda = dat$lambda, n = dat$n)
  data <- result$data
  params <- list(L = 5, scaled_prior_variance = 0.2, residual_variance = 1.0)
  var_y <- get_var_y.rss_lambda(data)
  model <- initialize_susie_model.rss_lambda(data, params, var_y)
  intercept <- get_intercept.rss_lambda(data, params, model)
  expect_type(intercept, "double")
  expect_length(intercept, 1)
  expect_equal(intercept, data$intercept_value)
})

test_that("get_fitted.rss_lambda delegates to default method", {
  dat <- setup_rss_lambda_data(seed = 30)
  result <- rss_lambda_constructor(z = dat$z, R = dat$R,
                                   lambda = dat$lambda, n = dat$n)
  data <- result$data
  params <- list(L = 5, scaled_prior_variance = 0.2, residual_variance = 1.0)
  var_y <- get_var_y.rss_lambda(data)
  model <- initialize_susie_model.rss_lambda(data, params, var_y)
  fitted <- get_fitted.rss_lambda(data, params, model)
  # Default method returns NULL for RSS data
  expect_null(fitted)
})

test_that("get_cs.rss_lambda returns NULL when coverage is NULL", {
  dat <- setup_rss_lambda_data(seed = 31)
  result <- rss_lambda_constructor(z = dat$z, R = dat$R,
                                   lambda = dat$lambda, n =
dat$n)
  data <- result$data
  params <- list(L = 5, coverage = NULL, min_abs_corr = 0.5,
                 scaled_prior_variance = 0.2, residual_variance = 1.0,
                 prior_weights = rep(1/dat$p, dat$p))
  var_y <- get_var_y.rss_lambda(data)
  model <- initialize_susie_model.rss_lambda(data, params, var_y)
  cs <- get_cs.rss_lambda(data, params, model)
  expect_null(cs)
})

test_that("get_cs.rss_lambda returns NULL when min_abs_corr is NULL", {
  dat <- setup_rss_lambda_data(seed = 32)
  result <- rss_lambda_constructor(z = dat$z, R = dat$R,
                                   lambda = dat$lambda, n = dat$n)
  data <- result$data
  params <- list(L = 5, coverage = 0.95, min_abs_corr = NULL,
                 scaled_prior_variance = 0.2, residual_variance = 1.0,
                 prior_weights = rep(1/dat$p, dat$p))
  var_y <- get_var_y.rss_lambda(data)
  model <- initialize_susie_model.rss_lambda(data, params, var_y)
  cs <- get_cs.rss_lambda(data, params, model)
  expect_null(cs)
})

test_that("get_cs.rss_lambda uses correlation from R matrix", {
  dat <- setup_rss_lambda_data(seed = 33)
  result <- rss_lambda_constructor(z = dat$z, R = dat$R,
                                   lambda = dat$lambda, n = dat$n)
  data <- result$data
  params <- list(L = 5, coverage = 0.95, min_abs_corr = 0.5, n_purity = 100,
                 scaled_prior_variance = 0.2, residual_variance = 1.0,
                 prior_weights = rep(1/dat$p, dat$p))
  var_y <- get_var_y.rss_lambda(data)
  model <- initialize_susie_model.rss_lambda(data, params, var_y)
  # Add strong signal to create credible set
  model$alpha[1, 1] <- 0.95
  model$alpha[1, -1] <- 0.05 / (dat$p - 1)
  cs <- get_cs.rss_lambda(data, params, model)
  # May or may not find CS, but should not error
  expect_true(is.null(cs) || is.list(cs))
})

test_that("get_variable_names.rss_lambda assigns variable names to model", {
  dat <- setup_rss_lambda_data(seed = 34)
  # Create named z-scores
  z_named <- dat$z
  names(z_named) <- paste0("var", 1:dat$p)
  result <- rss_lambda_constructor(z = z_named, R = dat$R,
                                   lambda = dat$lambda, n = dat$n)
  data <- result$data
  params <- list(L = 5, scaled_prior_variance = 0.2, residual_variance = 1.0,
prior_weights = rep(1/dat$p, dat$p))
  var_y <- get_var_y.rss_lambda(data)
  model <- initialize_susie_model.rss_lambda(data, params, var_y)
  model$pip <- rep(0.1, dat$p)
  model$null_weight <- NULL
  model$alpha <- matrix(0, 5, dat$p)
  model$mu <- matrix(0, 5, dat$p)
  model$mu2 <- matrix(0, 5, dat$p)
  model$lbf_variable <- matrix(0, 5, dat$p)
  model_with_names <- get_variable_names.rss_lambda(data, model)
  expect_true(all(grepl("var", colnames(model_with_names$alpha))))
  expect_true(all(grepl("var", colnames(model_with_names$mu))))
  expect_true(all(grepl("var", colnames(model_with_names$mu2))))
  expect_true(all(grepl("var", names(model_with_names$pip))))
})

test_that("get_zscore.rss_lambda delegates to default method", {
  dat <- setup_rss_lambda_data(seed = 35)
  result <- rss_lambda_constructor(z = dat$z, R = dat$R,
                                   lambda = dat$lambda, n = dat$n)
  data <- result$data
  params <- list(L = 5, compute_univariate_zscore = TRUE,
                 scaled_prior_variance = 0.2, residual_variance = 1.0,
                 prior_weights = rep(1/dat$p, dat$p))
  var_y <- get_var_y.rss_lambda(data)
  model <- initialize_susie_model.rss_lambda(data, params, var_y)
  z <- get_zscore.rss_lambda(data, params, model)
  # Default returns NULL
  expect_null(z)
})

test_that("cleanup_model.rss_lambda removes temporary fields", {
  dat <- setup_rss_lambda_data(seed = 38)
  result <- rss_lambda_constructor(z = dat$z, R = dat$R,
                                   lambda = dat$lambda, n = dat$n)
  data <- result$data
  params <- list(L = 5, scaled_prior_variance = 0.2, residual_variance = 1.0)
  var_y <- get_var_y.rss_lambda(data)
  model <- initialize_susie_model.rss_lambda(data, params, var_y)
  model$Rz <- rep(0, dat$p)
  model$Z <- matrix(0, 5, dat$p)
  model$zbar <- rep(0, dat$p)
  model$diag_postb2 <- rep(0, dat$p)
  # Cleanup model
  cleaned <- cleanup_model.rss_lambda(data, params, model)
  # Check that temporary fields are removed
  expect_false("SinvRj" %in% names(cleaned))
  expect_false("RjSinvRj" %in% names(cleaned))
  expect_false("Rz" %in% names(cleaned))
  expect_false("Z" %in% names(cleaned))
expect_false("zbar" %in% names(cleaned))
  expect_false("diag_postb2" %in% names(cleaned))
  # Check that essential fields remain
  expect_true("alpha" %in% names(cleaned))
  expect_true("mu" %in% names(cleaned))
  expect_true("mu2" %in% names(cleaned))
})

# =============================================================================
# FINITE-REFERENCE R INFLATION TESTS
# =============================================================================

test_that("compute_ser_statistics.rss_lambda returns betahat", {
  dat <- setup_rss_lambda_data(seed = 40)
  data <- dat$data
  params <- dat$params
  model <- dat$model
  model$Rz <- as.vector(data$R %*% colSums(model$alpha * model$mu))
  model <- compute_residuals.rss_lambda(data, params, model, l = 1)
  ser_stats <- compute_ser_statistics.rss_lambda(data, params, model, l = 1)
  expect_true("betahat" %in% names(ser_stats))
  expect_length(ser_stats$betahat, dat$p)
  expect_true(all(is.finite(ser_stats$betahat)))
})

test_that("compute_residuals.rss_lambda does not set shat2_inflation", {
  # rss_lambda path no longer carries per-variant inflation; the
  # entry-level error in susie_rss blocks lambda > 0 + R_finite, so
  # data$R_finite_B is never set on an rss_lambda data object.
dat <- setup_rss_lambda_data(seed = 42)
  data <- dat$data
  params <- dat$params
  model <- dat$model
  model$Rz <- as.vector(data$R %*% colSums(model$alpha * model$mu))
  expect_null(data$R_finite_B)
  model <- compute_residuals.rss_lambda(data, params, model, l = 1)
  expect_null(model$shat2_inflation)
})

# =============================================================================
# R vs X INPUT PATH AGREEMENT
# =============================================================================

test_that("R and X input paths produce numerically identical results", {
  set.seed(50)
  p <- 30
  n <- 500
  B <- 200
  X_full <- matrix(rnorm(n * p), n, p)
  X_full <- scale(X_full, center = TRUE, scale = TRUE)
  y <- X_full[, 1] * 0.5 + rnorm(n)
  input_ss <- compute_suff_stat(X_full, y, standardize = TRUE)
  R <- cov2cor(input_ss$XtX)
  R <- (R + t(R)) / 2
  ss <- univariate_regression(X_full, y)
  z <- ss$betahat / ss$sebetahat
  # Use X as a finite-reference factor; here use X_full itself (B=n)
  X_ref <- X_full
  # Construct from R
  res_R <- rss_lambda_constructor(z = z, R = R, lambda = 0.1, n = n)
  # Construct from X
  res_X <- rss_lambda_constructor(z = z, X = X_ref, lambda = 0.1, n = n)
  # Eigendecomposition should be very close
  # (sorted eigenvalues should match; eigenvectors may differ in sign)
  expect_equal(res_R$data$eigen_R$values, res_X$data$eigen_R$values,
               tolerance = 1e-6)
  # Initialize and run one SER iteration
  var_y_R <- get_var_y.rss_lambda(res_R$data)
  model_R <- initialize_susie_model.rss_lambda(res_R$data, res_R$params, var_y_R)
  model_R$Rz <- as.vector(R %*% colSums(model_R$alpha * model_R$mu))
  var_y_X <- get_var_y.rss_lambda(res_X$data)
  model_X <- initialize_susie_model.rss_lambda(res_X$data, res_X$params, var_y_X)
  model_X$Rz <- as.vector(compute_Rv(res_X$data,
                                     colSums(model_X$alpha * model_X$mu)))
  # RjSinvRj should agree
  expect_equal(model_R$RjSinvRj, model_X$RjSinvRj, tolerance = 1e-6)
  # Compute residuals
  model_R <- compute_residuals.rss_lambda(res_R$data, res_R$params, model_R, l = 1)
  model_X <-
compute_residuals.rss_lambda(res_X$data, res_X$params, model_X, l = 1)
  expect_equal(model_R$residuals, model_X$residuals, tolerance = 1e-6)
  # SER statistics
  stats_R <- compute_ser_statistics.rss_lambda(res_R$data, res_R$params,
                                               model_R, l = 1)
  stats_X <- compute_ser_statistics.rss_lambda(res_X$data, res_X$params,
                                               model_X, l = 1)
  expect_equal(stats_R$betahat, stats_X$betahat, tolerance = 1e-6)
  expect_equal(stats_R$shat2, stats_X$shat2, tolerance = 1e-6)
})

# =============================================================================
# END-TO-END susie_rss_lambda
# =============================================================================

test_that("susie_rss_lambda with lambda > 0 runs", {
  set.seed(51)
  p <- 50
  n <- 2000
  X <- matrix(rnorm(n * p), n, p)
  X <- scale(X, center = TRUE, scale = TRUE)
  beta <- rep(0, p)
  beta[1] <- 0.5
  beta[10] <- -0.3
  y <- drop(X %*% beta + rnorm(n))
  input_ss <- compute_suff_stat(X, y, standardize = TRUE)
  R <- cov2cor(input_ss$XtX)
  R <- (R + t(R)) / 2
  ss <- univariate_regression(X, y)
  z <- ss$betahat / ss$sebetahat
  fit <- susie_rss_lambda(z = z, R = R, lambda = 0.1, n = n, L = 5,
                          max_iter = 50, verbose = FALSE)
  expect_true(fit$converged)
  expect_true(is.finite(fit$elbo[length(fit$elbo)]))
  expect_true(fit$pip[1] > 0.5)
})

test_that("susie_rss_lambda excludes R_finite, R_mismatch, and multi-panel", {
  set.seed(511)
  p <- 20
  n <- 1000
  X <- matrix(rnorm(n * p), n, p)
  R <- cor(X)
  z <- rnorm(p)
  expect_error(
    susie_rss_lambda(z = z, R = R, n = n, L = 3, lambda = 0.1,
                     R_finite = 5000, max_iter = 2, verbose = FALSE),
    "unused argument"
  )
  expect_error(
    susie_rss_lambda(z = z, R = R, n = n, L = 3, lambda = 0.1,
                     R_mismatch = "map", max_iter = 2, verbose = FALSE),
    "unused argument"
  )
  expect_error(
    susie_rss_lambda(z = z, R = R, n = n, L = 3, lambda = 0.1,
                     R_mismatch = "map_qc", max_iter = 2, verbose = FALSE),
    "unused argument"
  )
  expect_error(
    susie_rss_lambda(z = z, X = list(X, X), n = n, L = 3, lambda = 0.1,
                     max_iter = 2, verbose = FALSE),
    "single X
matrix"
  )
})

test_that("R_mismatch requires R_finite and stores lambda_bias and B_corrected", {
  set.seed(511)
  p <- 20
  n <- 1000
  X <- matrix(rnorm(n * p), n, p)
  R <- cor(X)
  z <- rnorm(p)
  expect_error(
    susie_rss(z = z, R = R, n = n, L = 3, R_mismatch = "map",
              max_iter = 2, verbose = FALSE),
    "R_mismatch requires R_finite"
  )
  # F6: "mle" is no longer a valid choice.
  expect_error(
    susie_rss(z = z, R = R, n = n, L = 3, R_finite = 10000,
              R_mismatch = "mle", max_iter = 2, verbose = FALSE),
    "should be one of"
  )
  # F5: estimate_residual_variance with R_mismatch warns (via warning_message,
  # which uses message()) and is auto-disabled.
  expect_message(
    fit_warn <- susie_rss(z = z, R = R, n = n, L = 3, R_finite = 10000,
                          R_mismatch = "map", estimate_residual_variance = TRUE,
                          max_iter = 2, verbose = FALSE),
    "incompatible with"
  )
  fit <- susie_rss(z = z, R = R, n = n, L = 3, R_finite = 10000,
                   R_mismatch = "map", max_iter = 2, verbose = FALSE)
  # SS path: region-level scalar lambda_bias and B_corrected (Commit 3 redesign).
  expect_length(fit$R_finite_diagnostics$lambda_bias, 1)
  # B_corrected = 1 / (1/R_finite_B + lambda_bias).
  expect_length(fit$R_finite_diagnostics$B_corrected, 1)
  expect_true(fit$R_finite_diagnostics$lambda_bias >= 0)
  R_finiteB <- fit$R_finite_diagnostics$B
  if (fit$R_finite_diagnostics$lambda_bias > 0) {
    expect_true(fit$R_finite_diagnostics$B_corrected < R_finiteB)
  } else {
    expect_equal(fit$R_finite_diagnostics$B_corrected, R_finiteB)
  }
})

test_that("R_mismatch = 'none' is identical to no-R_mismatch call", {
  # Spec invariant 5.1(b): R_mismatch = 'none' must reduce to the un-augmented
  # variance model exactly.
set.seed(913)
  p <- 25
  n <- 2000
  X <- matrix(rnorm(n * p), n, p)
  R <- cor(X)
  z <- rnorm(p)
  z[3] <- 4
  fit_none <- susie_rss(z = z, R = R, n = n, L = 3, R_finite = 5000,
                        R_mismatch = "none", max_iter = 5, verbose = FALSE)
  fit_default <- susie_rss(z = z, R = R, n = n, L = 3, R_finite = 5000,
                           max_iter = 5, verbose = FALSE)
  expect_equal(fit_none$pip, fit_default$pip, tolerance = 1e-12)
  expect_equal(fit_none$alpha, fit_default$alpha, tolerance = 1e-12)
  expect_null(fit_none$lambda_bias)
})

test_that("Fisher SE zero-mask sends near-boundary estimates to 0", {
  # Under the null (z ~ N(0,1)) with no real drift, lambda_bias should
  # be masked to exactly 0 by the Fisher-SE rule
  # (ld_mismatch_generativemodel.tex Sec.~zero_mask).
  set.seed(7)
  p <- 50
  n <- 5000
  X <- matrix(rnorm(n * p), n, p)
  R <- cor(X)
  z <- rnorm(p) # pure null
  fit <- susie_rss(z = z, R = R, n = n, L = 3, R_finite = 10000,
                   R_mismatch = "map", max_iter = 5, verbose = FALSE)
  # All entries should be cleanly zero, not ~4e-9 optimizer floor.
  lb <- fit$R_finite_diagnostics$lambda_bias
  expect_true(all(lb == 0 | lb > 1e-6),
              info = "Fisher zero-mask must leave no values in the (0, 1e-6) gap")
})

test_that("In-sample LD identity yields lambda_bias = 0 (spec invariant 5.3)", {
  # Spec invariant 5.3: when R is the in-sample LD of the data that
  # produced z, there is no population mismatch and the MAP estimator
  # should drive lambda_bias to 0 (modulo Fisher mask).
set.seed(2024)
  p <- 30
  n <- 4000
  X <- matrix(rnorm(n * p), n, p)
  X <- scale(X, center = TRUE, scale = TRUE)
  beta <- rep(0, p); beta[5] <- 0.4
  y <- drop(X %*% beta + rnorm(n))
  ss <- compute_suff_stat(X, y, standardize = TRUE)
  R <- cov2cor(ss$XtX)
  z <- ss$XtX %*% beta / sqrt(diag(ss$XtX)) + rnorm(p)
  z <- as.numeric(z)
  fit <- susie_rss(z = z, R = R, n = n, L = 3, R_finite = 5000,
                   R_mismatch = "map", max_iter = 8, verbose = FALSE)
  expect_true(all(fit$R_finite_diagnostics$lambda_bias == 0),
              info = "In-sample LD must produce lambda_bias = 0")
})

test_that("In-sample LD with multiple sparse signals does not inflate lambda_bias", {
  # Regression for the confounding failure mode: estimating lambda_bias from
  # the leave-one-effect residual can mistake the lth sparse signal for
  # population LD mismatch and suppress power. The generative target is the
  # full residual after all current sparse effects are removed.
  set.seed(44)
  n <- 1000
  p <- 120
  rho <- 0.95
  Sigma <- rho^abs(outer(seq_len(p), seq_len(p), "-"))
  X <- matrix(rnorm(n * p), n, p) %*% chol(Sigma)
  X <- scale(X, center = TRUE, scale = TRUE)
  beta <- rep(0, p)
  causal <- c(20, 60, 100)
  beta[causal] <- c(0.18, -0.20, 0.22)
  y <- drop(X %*% beta + rnorm(n))
  z <- calc_z(X, y, center = TRUE, scale = FALSE)
  fit <- susie_rss(z = z, X = X, n = n, L = 6, R_finite = TRUE,
                   R_mismatch = "map", max_iter = 50, verbose = FALSE)
  expect_true(max(fit$R_finite_diagnostics$lambda_bias) < 0.01,
              info = "In-sample LD should not estimate large population mismatch")
  expect_gt(max(fit$pip[causal]), 0.5)
})

test_that("R_mismatch = 'mle' is rejected at all entry points", {
  # F6 closure: rejecting "mle" must hold at the public function AND
  # at the internal constructors so that downstream packages cannot
  # silently invoke ML.
set.seed(31)
  p <- 20; n <- 1000
  X <- matrix(rnorm(n * p), n, p)
  R <- cor(X); z <- rnorm(p)
  expect_error(
    susie_rss(z = z, R = R, n = n, L = 3, R_finite = 10000,
              R_mismatch = "mle", max_iter = 1, verbose = FALSE),
    "should be one of"
  )
  expect_error(
    summary_stats_constructor(z = z, R = R, n = n, L = 3,
                              R_finite = 10000, R_mismatch = "mle"),
    "should be one of"
  )
})

test_that("Large R_finite limit reduces to pure-drift estimator", {
  # When 1/R_finite is negligible, B_corrected ~ 1/lambda_bias and the
  # finite-reference contribution to tau^2 vanishes.
  set.seed(11)
  p <- 30; n <- 4000
  X <- matrix(rnorm(n * p), n, p)
  R <- cor(X)
  beta <- rep(0, p); beta[1] <- 0.6
  z <- as.numeric(R %*% beta * sqrt(n) + rnorm(p))
  fit <- susie_rss(z = z, R = R, n = n, L = 3, R_finite = 1e12,
                   R_mismatch = "map", max_iter = 5, verbose = FALSE)
  lb <- fit$R_finite_diagnostics$lambda_bias
  bc <- fit$R_finite_diagnostics$B_corrected
  active <- lb > 0
  if (any(active)) {
    expect_equal(bc[active], 1 / lb[active], tolerance = 1e-6,
                 info = "B_corrected -> 1/lambda_bias as R_finite -> Inf")
  }
})

test_that("tau_j^2 is monotone non-decreasing in lambda_bias", {
  # Spec invariant 5.1(e): tau_j^2(lambda) = sigma^2 + (1/B + lambda) * s_j
  # is monotone non-decreasing in lambda for s_j >= 0.
s <- c(0.5, 1.5, 3.0, 0.0)
  sigma2 <- 1.2
  B <- 1000
  tau2 <- function(lambda) sigma2 + (1 / B + lambda) * s
  expect_true(all(tau2(0.05) >= tau2(0)))
  expect_true(all(tau2(0.5) >= tau2(0.05)))
  expect_true(all(tau2(0)[s == 0] == sigma2))
})

test_that("loglik.rss_lambda Wakefield ABF agrees with old signal-based form", {
  # Verify the Wakefield ABF form gives the same result as the original
  # signal^2 / RjSinvRj form when there is no inflation
  dat <- setup_rss_lambda_data(seed = 53)
  data <- dat$data
  params <- dat$params
  model <- dat$model
  model$Rz <- as.vector(data$R %*% colSums(model$alpha * model$mu))
  model <- compute_residuals.rss_lambda(data, params, model, l = 1)
  ser_stats <- compute_ser_statistics.rss_lambda(data, params, model, l = 1)
  # Compute BF using Wakefield ABF (current code)
  V <- 0.2
  shat2 <- pmax(ser_stats$shat2, .Machine$double.eps)
  lbf_wakefield <- -0.5 * log(1 + V / shat2) +
    0.5 * ser_stats$betahat^2 * V / (shat2 * (V + shat2))
  # Compute BF using the original SinvRj form:
  # lbf = -0.5 * log(1 + V * RjSinvRj) + 0.5 * V * signal^2 / (1 + V * RjSinvRj)
  # where signal = SinvRj' * r, and shat2 = 1/RjSinvRj, betahat = signal * shat2
  signal <- as.vector(crossprod(model$SinvRj, model$residuals))
  RjSinvRj <- model$RjSinvRj
  lbf_original <- -0.5 * log(1 + V * RjSinvRj) +
    0.5 * V * signal^2 / (1 + V * RjSinvRj)
  expect_equal(lbf_wakefield, lbf_original, tolerance = 1e-10)
})

# =============================================================================
# SS vs RSS-LAMBDA CROSS-PATH AGREEMENT TESTS
# =============================================================================

test_that("SS and RSS-lambda paths agree with small lambda (no inflation)", {
  set.seed(200)
  p <- 50; n <- 2000
  X <- matrix(rnorm(n * p), n, p)
  X <- scale(X, center = TRUE, scale = TRUE)
  beta <- rep(0, p)
  beta[1] <- 0.5; beta[10] <- -0.3
  y <- drop(X %*% beta + rnorm(n))
  input_ss <- compute_suff_stat(X, y, standardize = TRUE)
  R <- cov2cor(input_ss$XtX); R <- (R + t(R)) / 2
  ss <-
univariate_regression(X, y)
  z <- ss$betahat / ss$sebetahat
  # SS path (lambda = 0)
  fit_ss <- susie_rss(z = z, R = R, n = n, L = 5, max_iter = 100, verbose = FALSE)
  # RSS-lambda path (tiny lambda ~= 0)
  fit_rss <- susie_rss_lambda(z = z, R = R, n = n, L = 5, lambda = 1e-6,
                              max_iter = 100, verbose = FALSE)
  expect_true(fit_ss$converged)
  expect_true(fit_rss$converged)
  # Alpha matrices should be essentially identical
  expect_equal(fit_ss$alpha, fit_rss$alpha, tolerance = 1e-4)
  # PIPs should match
  expect_equal(fit_ss$pip, fit_rss$pip, tolerance = 1e-4)
})

# =============================================================================
# MULTI-PANEL R MIXTURE TESTS
# =============================================================================

test_that("form_X_meta combines panels correctly", {
  set.seed(42)
  p <- 10
  X1 <- matrix(rnorm(50 * p), 50, p)
  X2 <- matrix(rnorm(30 * p), 30, p)
  omega <- c(0.6, 0.4)
  X_meta <- form_X_meta(list(X1, X2), omega)
  expect_equal(nrow(X_meta), 80)
  expect_equal(ncol(X_meta), p)
  # First 50 rows scaled by sqrt(0.6)
  expect_equal(X_meta[1:50, ], sqrt(0.6) * X1)
  # Last 30 rows scaled by sqrt(0.4)
  expect_equal(X_meta[51:80, ], sqrt(0.4) * X2)
})

test_that("eigen_from_X recovers eigendecomposition of X'X", {
  set.seed(43)
  p <- 20
  X <- matrix(rnorm(100 * p), 100, p)
  R <- crossprod(X)
  eigen_R_direct <- eigen(R, symmetric = TRUE)
  eigen_R_svd <- eigen_from_X(X, p)
  # Eigenvalues should match
  expect_equal(eigen_R_svd$values, eigen_R_direct$values, tolerance = 1e-10)
  # Eigenvectors span same space (up to sign)
  for (j in seq_len(p)) {
    inner <- abs(sum(eigen_R_svd$vectors[, j] * eigen_R_direct$vectors[, j]))
    expect_gt(inner, 0.99)
  }
})

test_that("eval_omega_eloglik_reduced matches pure R reference", {
  set.seed(44)
  p <- 50
  K <- 2
  # Create two panels with B_total < p so reduced-basis applies
  X1 <- matrix(rnorm(15 * p), 15, p)
  X2 <- matrix(rnorm(10 * p), 10, p)
  X_list <- list(X1, X2)
  # Use raw cross-products (matching constructor: lapply(X_list, crossprod))
  panel_R
<- list(crossprod(X1), crossprod(X2))
  z <- rnorm(p)
  zbar <- rnorm(p) * 0.1
  diag_postb2 <- abs(rnorm(p)) * 0.01
  L <- 3
  Z <- matrix(rnorm(L * p) * 0.05, L, p)
  sigma2 <- 0.9
  lambda <- 0.01
  omega <- c(0.7, 0.3)
  # Pure R reference (O(p^3) eigendecomposition using panel_R)
  val_R <- susieR:::eval_omega_eloglik_R(panel_R, omega, z, zbar, diag_postb2,
                                         Z, sigma2, lambda, K, p)
  # Reduced-basis (O(r^3) Cholesky using X_list)
  cache <- susieR:::precompute_omega_cache(X_list, z)
  iter_cache <- susieR:::precompute_omega_iteration(cache, zbar, diag_postb2, Z)
  val_reduced <- susieR:::eval_omega_eloglik_reduced(cache, omega, iter_cache,
                                                     sigma2, lambda, K, p)
  expect_equal(val_R, val_reduced, tolerance = 1e-6)
})

test_that("eval_omega_eloglik is concave in omega", {
  set.seed(45)
  p <- 20
  K <- 2
  X1 <- matrix(rnorm(60 * p), 60, p)
  X2 <- matrix(rnorm(50 * p), 50, p)
  panel_R <- list(crossprod(X1) / 60, crossprod(X2) / 50)
  z <- rnorm(p)
  zbar <- rnorm(p) * 0.1
  diag_postb2 <- abs(rnorm(p)) * 0.01
  Z <- matrix(rnorm(2 * p) * 0.05, 2, p)
  eloglik <- function(w1) {
    susieR:::eval_omega_eloglik_R(panel_R, c(w1, 1 - w1), z, zbar,
                                  diag_postb2, Z, 0.9, 0.01, K, p)
  }
  # Concavity: midpoint should be >= average of endpoints
  vals <- sapply(seq(0, 1, 0.1), eloglik)
  for (i in 1:(length(vals) - 2)) {
    midval <- vals[i + 1]
    avg_endpoints <- (vals[i] + vals[i + 2]) / 2
    expect_gte(midval, avg_endpoints - 1e-8)
  }
})

test_that("accessor helpers fall through for single panel", {
  dat <- setup_rss_lambda_data(seed = 50)
  model <- dat$model
  # model$eigen_R is NULL for single panel
  expect_null(model$eigen_R)
  # Accessor should return data$eigen_R
  eigen_R <- get_eigen_R(dat$data, model)
  expect_equal(eigen_R$values, dat$data$eigen_R$values)
  # Same for Vtz
  expect_null(model$Vtz)
  Vtz <- get_Vtz(dat$data, model)
  expect_equal(Vtz, dat$data$Vtz)
})

# =============================================================================
# RANK BOUND FALLBACK
# =============================================================================
#
=============================================================================
# TOLERANCE CONSTANTS
# =============================================================================

test_that(".omega_tol has expected fields", {
  tol <- susieR:::.omega_tol
  expect_true(is.list(tol))
  expect_true("convergence" %in% names(tol))
  expect_true("grid_spacing" %in% names(tol))
  expect_true("fw_stop" %in% names(tol))
  expect_true("fw_max_iter" %in% names(tol))
  # Sanity: values are positive
  expect_true(tol$convergence > 0)
  expect_true(tol$grid_spacing > 0 && tol$grid_spacing < 1)
  expect_true(tol$fw_stop > 0)
  expect_true(tol$fw_max_iter >= 1L)
})

# =============================================================================
# EIGEN_FROM_REDUCED UNIT TEST (Issue 21)
# =============================================================================

test_that("eigen_from_reduced recovers full eigendecomposition", {
  set.seed(55)
  p <- 30; B1 <- 40; B2 <- 35
  X1 <- matrix(rnorm(B1 * p), B1, p)
  X2 <- matrix(rnorm(B2 * p), B2, p)
  X_list <- lapply(list(X1, X2), susieR:::standardize_X)
  z <- rnorm(p)
  cache <- susieR:::precompute_omega_cache(X_list, z)
  omega <- c(0.7, 0.3)
  eig_reduced <- susieR:::eigen_from_reduced(cache, omega, K = 2, p = p)
  # Direct eigendecomposition of R(omega)
  R_omega <- omega[1] * crossprod(X_list[[1]]) + omega[2] * crossprod(X_list[[2]])
  R_omega <- 0.5 * (R_omega + t(R_omega))
  eig_direct <- eigen(R_omega, symmetric = TRUE)
  # Eigenvalues should match (within reduced rank)
  r <- cache$r
  expect_equal(eig_reduced$values[1:r], eig_direct$values[1:r], tolerance = 1e-8)
  # Eigenvectors should span the same space: V_reduced' V_direct ~= I for top-r
  overlap <- abs(crossprod(eig_reduced$vectors[, 1:r], eig_direct$vectors[, 1:r]))
  # Each reduced eigenvector should align with exactly one direct eigenvector
  expect_true(all(apply(overlap, 1, max) > 1 - 1e-8))
})

# =============================================================================
# OMEGA AT SIMPLEX VERTEX (Issue 22)
#
=============================================================================

test_that("optimize_omega handles vertex optimum (one panel irrelevant)", {
  set.seed(57)
  p <- 25; B <- 100
  # Panel 1: true R, Panel 2: pure noise (identity-like)
  X1 <- matrix(rnorm(B * p), B, p)
  X_list <- lapply(list(X1, matrix(rnorm(B * p), B, p)), susieR:::standardize_X)
  z <- rnorm(p)
  # Construct data where panel 1 is much better
  R1 <- crossprod(X_list[[1]])
  R2 <- diag(p) # identity -- pure noise panel
  panel_R <- list(R1, R2)
  zbar <- rnorm(p) * 0.1
  diag_postb2 <- abs(rnorm(p)) * 0.01
  Z <- matrix(rnorm(2 * p) * 0.05, 2, p)
  eval_fn <- function(omega_vec) {
    susieR:::eval_omega_eloglik_R(panel_R, omega_vec, z, zbar, diag_postb2,
                                  Z, 0.9, 0.1, 2, p)
  }
  result <- susieR:::optimize_omega(eval_fn, c(0.5, 0.5), K = 2)
  # Should produce valid omega on simplex
  expect_equal(sum(result$omega), 1, tolerance = 1e-10)
  expect_true(all(result$omega >= -1e-10))
})


================================================
FILE: tests/testthat/test_rss_mismatch.R
================================================
context("RSS R-reference mismatch (R_mismatch correction)")

# ---- API surface guards ----

test_that("R_mismatch = 'map_qc' runs and returns Q_art diagnostics", {
  set.seed(11)
  p <- 20
  n <- 1000
  X <- matrix(rnorm(n * p), n, p)
  R <- cor(X)
  z <- rnorm(p)
  fit <- susie_rss(z = z, R = R, n = n, L = 3, R_finite = 5000,
                   R_mismatch = "map_qc", max_iter = 2, verbose = FALSE)
  d <- fit$R_finite_diagnostics
  expect_true(!is.null(d$Q_art))
  expect_true(d$Q_art >= 0 && d$Q_art <= 1)
  expect_true(is.logical(d$artifact_flag))
  expect_true(d$mode_label %in% c("normal", "warning", "conservative"))
})

test_that("Optional artifact args validate ranges", {
  set.seed(17)
  p <- 20
  n <- 1000
  X <- matrix(rnorm(n * p), n, p)
  R <- cor(X)
  z <- rnorm(p)
  expect_error(
    susie_rss(z = z, R = R, n = n, L = 3, R_finite = 5000, R_mismatch = "map",
              artifact_threshold = -0.1, max_iter = 2, verbose = FALSE),
    "artifact_threshold"
  )
  expect_error(
    susie_rss(z
= z, R = R, n = n, L = 3, R_finite = 5000, R_mismatch = "map",
              artifact_threshold = 1.1, max_iter = 2, verbose = FALSE),
    "artifact_threshold"
  )
  expect_error(
    susie_rss(z = z, R = R, n = n, L = 3, R_finite = 5000, R_mismatch = "map",
              eig_delta_rel = -1, max_iter = 2, verbose = FALSE),
    "eig_delta_rel"
  )
})

# ---- Region-level scalar lambda_bias on the SS path ----

test_that("SS path stores scalar lambda_bias / B_corrected (not per-slot)", {
  set.seed(101)
  p <- 25
  n <- 1500
  X <- matrix(rnorm(n * p), n, p)
  R <- cor(X)
  z <- rnorm(p)
  fit <- susie_rss(z = z, R = R, n = n, L = 3, R_finite = 5000,
                   R_mismatch = "map", max_iter = 5, verbose = FALSE)
  expect_length(fit$R_finite_diagnostics$lambda_bias, 1)
  expect_length(fit$R_finite_diagnostics$B_corrected, 1)
  expect_true(fit$R_finite_diagnostics$lambda_bias >= 0)
  expect_equal(fit$R_finite_diagnostics$B_corrected,
               1 / (1 / fit$R_finite_diagnostics$B +
                      fit$R_finite_diagnostics$lambda_bias),
               tolerance = 1e-12)
})

# ---- Q_art unit tests ----

test_that("compute_Q_art recovers Q ~ 1 when r_fit lies in low-eigen direction", {
  # Diagonal R with eigenvalues (2, 1, 1e-6). Default eig_delta_rel=1e-3
  # selects only the third eigenvalue.
V <- diag(3)
  d <- c(2, 1, 1e-6)
  eig <- list(values = d, vectors = V)
  r_fit <- c(0, 0, 1) # purely in the low-eigen direction
  out <- susieR:::compute_Q_art(eig, r_fit)
  expect_equal(out$Q_art, 1, tolerance = 1e-12)
  expect_true(out$evaluable)
  expect_equal(out$low_eigen_count, 1L)
})

test_that("compute_Q_art returns Q ~ 0 when r_fit avoids low-eigen directions", {
  V <- diag(3)
  d <- c(2, 1, 1e-6)
  eig <- list(values = d, vectors = V)
  r_fit <- c(1, 0.5, 0) # fully in top two eigen directions
  out <- susieR:::compute_Q_art(eig, r_fit)
  expect_equal(out$Q_art, 0, tolerance = 1e-12)
})

test_that("compute_Q_art is non-evaluable when r_fit has negligible energy", {
  V <- diag(3)
  d <- c(2, 1, 1e-6)
  eig <- list(values = d, vectors = V)
  out <- susieR:::compute_Q_art(eig, rep(0, 3))
  expect_equal(out$Q_art, 0)
  expect_false(out$evaluable)
})

test_that("compute_Q_art is non-evaluable when no low-eigenvalues exist", {
  V <- diag(3)
  d <- c(2, 1, 0.5) # all > 1e-3 * 2 = 2e-3
  eig <- list(values = d, vectors = V)
  out <- susieR:::compute_Q_art(eig, c(1, 0, 0))
  expect_equal(out$low_eigen_count, 0L)
  expect_false(out$evaluable)
})

test_that("compute_Q_art is in [0, 1] for typical inputs", {
  V <- diag(3)
  d <- c(2, 1, 1e-6)
  eig <- list(values = d, vectors = V)
  for (r_fit in list(c(1, 0, 0), c(0, 1, 0), c(0, 0, 1),
                     c(0.5, 0.5, 0.5), c(-1, 1, -1))) {
    out <- susieR:::compute_Q_art(eig, r_fit)
    expect_true(out$Q_art >= 0 && out$Q_art <= 1)
  }
})

# ---- map_qc end-to-end smoke ----

test_that("map_qc on well-behaved data yields Q_art near 0 and no flag", {
  set.seed(11)
  p <- 25
  n <- 2000
  X <- matrix(rnorm(n * p), n, p)
  R <- cor(X)
  z <- rnorm(p)
  z[3] <- 4
  fit <- susie_rss(z = z, R = R, n = n, L = 3, R_finite = 5000,
                   R_mismatch = "map_qc", max_iter = 5, verbose = FALSE)
  d <- fit$R_finite_diagnostics
  expect_lt(d$Q_art, 0.1)
  expect_false(d$artifact_flag)
  expect_equal(d$mode_label, "normal")
})

test_that("map_qc emits a true R warning when artifact_flag triggers", {
  rho <- 0.9999
  z <- c(-8, -8)
  R <- matrix(c(1,
-rho, -rho, 1), 2, 2)
  expect_warning(
    fit <- susie_rss(z = z, R = R, n = 5000, L = 1, R_finite = 1e6,
                     R_mismatch = "map_qc", max_iter = 5,
                     estimate_prior_variance = FALSE,
                     estimate_residual_variance = FALSE, verbose = FALSE),
    "Residual R-bias artifact detected"
  )
  expect_true(fit$R_finite_diagnostics$artifact_flag)
  expect_equal(fit$R_finite_diagnostics$Q_art, 1, tolerance = 1e-6)
})

test_that("map_qc surfaces Q_art and mode_label diagnostics", {
  set.seed(12)
  p <- 25; n <- 2000
  X <- matrix(rnorm(n * p), n, p)
  R <- cor(X)
  z <- rnorm(p)
  fit <- susie_rss(z = z, R = R, n = n, L = 3, R_finite = 5000,
                   R_mismatch = "map_qc", max_iter = 3, verbose = FALSE)
  d <- fit$R_finite_diagnostics
  for (fld in c("Q_art", "artifact_flag", "artifact_evaluable",
                "low_eigen_count", "low_eigen_fraction", "eig_delta",
                "mode_label", "lambda_bias", "B_corrected"))
    expect_true(!is.null(d[[fld]]), info = paste("missing diagnostic:", fld))
})

test_that("map_qc with X-input runs and surfaces Q_art", {
  set.seed(15)
  p <- 25; n <- 2000
  X <- matrix(rnorm(n * p), n, p)
  X <- scale(X, center = TRUE, scale = TRUE)
  beta <- rep(0, p); beta[5] <- 0.4
  y <- drop(X %*% beta + rnorm(n))
  z <- as.numeric(crossprod(X, y) / sqrt(diag(crossprod(X))))
  fit <- susie_rss(z = z, X = X, n = n, L = 3, R_finite = 5000,
                   R_mismatch = "map_qc", max_iter = 3, verbose = FALSE)
  d <- fit$R_finite_diagnostics
  expect_true(!is.null(d$Q_art))
  expect_true(d$Q_art >= 0 && d$Q_art <= 1)
})

test_that("map_qc works on lambda=0 multi-panel SS path", {
  set.seed(19)
  n <- 80
  p <- 12
  X1 <- matrix(rnorm(n * p), n, p)
  X2 <- matrix(rnorm(n * p), n, p)
  z <- rnorm(p)
  fit <- susie_rss(z = z, X = list(X1, X2), n = 1000, L = 3, R_finite = TRUE,
                   R_mismatch = "map_qc", max_iter = 3, verbose = FALSE)
  d <- fit$R_finite_diagnostics
  expect_true(!is.null(d$Q_art))
  expect_true(d$Q_art >= 0 && d$Q_art <= 1)
  expect_length(d$lambda_bias, 1)
})


================================================
FILE: tests/testthat/test_rss_utils.R
================================================

context("RSS utility functions")

# =============================================================================
# FUNDAMENTAL COMPUTATIONS
# =============================================================================

test_that("compute_suff_stat with standardize=FALSE produces correct XtX", {
  base_data <- generate_base_data(n = 10, p = 5, seed = 1)
  # Manual calculation: center X
  X_centered <- scale(base_data$X, center = TRUE, scale = FALSE)
  out <- compute_suff_stat(base_data$X, base_data$y, standardize = FALSE)
  dimnames(out$XtX) <- NULL
  expect_equal(out$XtX, crossprod(X_centered), tolerance = 1e-14)
})

test_that("compute_suff_stat with standardize=TRUE produces correct XtX", {
  base_data <- generate_base_data(n = 10, p = 5, seed = 2)
  # Manual calculation: center and scale X
  X_standardized <- scale(base_data$X, center = TRUE, scale = TRUE)
  out <- compute_suff_stat(base_data$X, base_data$y, standardize = TRUE)
  dimnames(out$XtX) <- NULL
  expect_equal(out$XtX, crossprod(X_standardized), tolerance = 1e-14)
})

test_that("compute_suff_stat with sparse matrix input", {
  # Sparse and dense inputs must produce numerically identical statistics.
  base_data <- generate_base_data(n = 10, p = 5, seed = 3)
  # Sparse version
  X_sparse <- as(base_data$X, "sparseMatrix")
  out_dense <- compute_suff_stat(base_data$X, base_data$y, standardize = FALSE)
  out_sparse <- compute_suff_stat(X_sparse, base_data$y, standardize = FALSE)
  dimnames(out_dense$XtX) <- NULL
  dimnames(out_sparse$XtX) <- NULL
  expect_equal(out_sparse$XtX, out_dense$XtX, tolerance = 1e-14)
  expect_equal(as.vector(out_sparse$Xty), out_dense$Xty, tolerance = 1e-14)
  expect_equal(out_sparse$yty, out_dense$yty, tolerance = 1e-14)
})

test_that("compute_suff_stat produces correct Xty", {
  base_data <- generate_base_data(n = 20, p = 8, seed = 4)
  out <- compute_suff_stat(base_data$X, base_data$y, standardize = FALSE)
  # Manual calculation
  y_centered <- base_data$y - mean(base_data$y)
  X_centered <- scale(base_data$X, center = TRUE, scale = FALSE)
  expected_Xty <- drop(crossprod(X_centered, y_centered))
  expect_equal(out$Xty, expected_Xty, tolerance = 1e-14)
})

test_that("compute_suff_stat produces correct yty", {
  base_data <- generate_base_data(n = 20, p = 8, seed = 5)
  out <- compute_suff_stat(base_data$X, base_data$y, standardize = FALSE)
  # Manual calculation
  y_centered <- base_data$y - mean(base_data$y)
  expected_yty <- sum(y_centered^2)
  expect_equal(out$yty, expected_yty, tolerance = 1e-14)
})

test_that("compute_suff_stat stores column means and y_mean", {
  base_data <- generate_base_data(n = 15, p = 6, seed = 6)
  out <- compute_suff_stat(base_data$X, base_data$y, standardize = FALSE)
  expect_equal(out$X_colmeans, colMeans(base_data$X), tolerance = 1e-14)
  expect_equal(out$y_mean, mean(base_data$y), tolerance = 1e-14)
  expect_equal(out$n, base_data$n)
})

test_that("compute_suff_stat with standardize=TRUE scales correctly", {
  base_data <- generate_base_data(n = 25, p = 10, seed = 7)
  out <- compute_suff_stat(base_data$X, base_data$y, standardize = TRUE)
  # XtX diagonal should be close to n (since standardized columns have variance 1)
  # After centering: crossprod of standardized X
  X_std <- scale(base_data$X, center = TRUE, scale = TRUE)
  expected_diag <- diag(crossprod(X_std))
  expect_equal(diag(out$XtX), expected_diag, tolerance = 1e-12)
})

test_that("compute_suff_stat returns list with correct names", {
  base_data <- generate_base_data(n = 10, p = 5, seed = 8)
  out <- compute_suff_stat(base_data$X, base_data$y, standardize = FALSE)
  expect_type(out, "list")
  expect_named(out, c("XtX", "Xty", "yty", "n", "y_mean", "X_colmeans"))
})

test_that("compute_suff_stat matches susie_ss input requirements", {
  base_data <- generate_base_data(n = 100, p = 50, seed = 9)
  ss <- compute_suff_stat(base_data$X, base_data$y, standardize = TRUE)
  # Should be able to use directly with susie_ss
  expect_error(
    fit <- susie_ss(ss$XtX, ss$Xty, ss$yty, n = ss$n, L = 5,
                    max_iter = 2, verbose = FALSE),
    NA
  )
})

test_that("compute_suff_stat with zero-variance column", {
  skip("Fails on Linux in CI")
  base_data <- generate_base_data(n = 20, p = 5, seed = 10)
  base_data$X[, 3] <- 1 # Constant column (zero variance after centering)
  # Should not error
  expect_error(
    out <- compute_suff_stat(base_data$X, base_data$y, standardize = TRUE),
    NA
  )
  expect_true(is.infinite(out$Xty[3]))
})

# =============================================================================
# RSS MODEL METHODS
# =============================================================================

test_that("estimate_s_rss returns value between 0 and 1 (null-mle)", {
  base_data <- generate_base_data(n = 100, p = 50, seed = 11)
  ss <- univariate_regression(base_data$X, base_data$y)
  R <- cor(base_data$X)
  z <- with(ss, betahat / sebetahat)
  s <- estimate_s_rss(z, R, n = base_data$n, method = "null-mle")
  expect_type(s, "double")
  expect_length(s, 1)
  expect_true(s >= 0 && s <= 1)
})

test_that("estimate_s_rss with null-partialmle method", {
  base_data <- generate_base_data(n = 100, p = 50, seed = 12)
  ss <- univariate_regression(base_data$X, base_data$y)
  R <- cor(base_data$X)
  z <- with(ss, betahat / sebetahat)
  s <- estimate_s_rss(z, R, n = base_data$n, method = "null-partialmle")
  expect_type(s, "double")
  expect_length(s, 1)
  # Note: null-partialmle can be > 1
  expect_true(s >= 0)
})

test_that("estimate_s_rss with null-pseudomle method", {
  base_data <- generate_base_data(n = 100, p = 50, seed = 13)
  ss <- univariate_regression(base_data$X, base_data$y)
  R <- cor(base_data$X)
  z <- with(ss, betahat / sebetahat)
  s <- estimate_s_rss(z, R, n = base_data$n, method = "null-pseudomle")
  expect_type(s, "double")
  expect_length(s, 1)
  expect_true(s >= 0 && s <= 1)
})

test_that("estimate_s_rss warns when n is not provided", {
  # NOTE(review): test name says "warns" but the assertion is expect_message;
  # presumably the implementation emits a message() — confirm against
  # estimate_s_rss and consider renaming for accuracy.
  base_data <- generate_base_data(n = 100, p = 50, seed = 14)
  ss <- univariate_regression(base_data$X, base_data$y)
  R <- cor(base_data$X)
  z <- with(ss, betahat / sebetahat)
  expect_message(
    s <- estimate_s_rss(z, R),
    "sample size"
  )
})

test_that("estimate_s_rss errors when n <= 1", {
  base_data <- generate_base_data(n = 100, p = 50, seed = 15)
  ss <- univariate_regression(base_data$X, base_data$y)
  R <- cor(base_data$X)
  z <- with(ss, betahat / sebetahat)
  expect_error(
    estimate_s_rss(z, R, n = 1),
    "must be greater than 1"
  )
  expect_error(
    estimate_s_rss(z, R, n = 0),
    "must be greater than 1"
  )
})

test_that("estimate_s_rss handles eigen decomposition in R", {
  # Supplying a pre-computed eigen decomposition via attr(R, "eigen") must
  # give the same estimate as letting the function decompose R itself.
  base_data <- generate_base_data(n = 100, p = 50, seed = 16)
  ss <- univariate_regression(base_data$X, base_data$y)
  R <- cor(base_data$X)
  z <- with(ss, betahat / sebetahat)
  # Pre-compute eigen decomposition
  attr(R, "eigen") <- eigen(R, symmetric = TRUE)
  s1 <- estimate_s_rss(z, R, n = base_data$n, method = "null-mle")
  # Without pre-computed eigen
  R2 <- cor(base_data$X)
  s2 <- estimate_s_rss(z, R2, n = base_data$n, method = "null-mle")
  expect_equal(s1, s2, tolerance = 1e-10)
})

test_that("estimate_s_rss handles negative eigenvalues in R", {
  set.seed(17)
  p <- 50
  # Create R with intentionally negative eigenvalue
  R <- matrix(0.5, p, p)
  diag(R) <- 1
  R[1, 2] <- 1.5
  R[2, 1] <- 1.5
  z <- rnorm(p)
  expect_message(
    s <- estimate_s_rss(z, R, n = 100, method = "null-mle"),
    "not positive semidefinite"
  )
  # Should still return valid estimate
  expect_true(s >= 0 && s <= 1)
})

test_that("estimate_s_rss handles NA values in z", {
  base_data <- generate_base_data(n = 100, p = 50, seed = 18)
  ss <- univariate_regression(base_data$X, base_data$y)
  R <- cor(base_data$X)
  z <- with(ss, betahat / sebetahat)
  # Introduce NA
  z[5] <- NA
  expect_error(
    s <- estimate_s_rss(z, R, n = base_data$n, method = "null-mle"),
    NA
  )
  expect_true(s >= 0 && s <= 1)
})

test_that("estimate_s_rss with perfect LD has one large eigenvalue", {
  set.seed(19)
  p <- 10
  # All variables perfectly correlated
  R <- matrix(1, p, p)
  z <- rnorm(p)
  s <- estimate_s_rss(z, R, n = 100, method = "null-partialmle")
  expect_true(s >= 0)
})

test_that("estimate_s_rss errors on invalid method", {
  base_data <- generate_base_data(n = 100, p = 50, seed = 20)
  ss <- univariate_regression(base_data$X, base_data$y)
  R <- cor(base_data$X)
  z <- with(ss, betahat / sebetahat)
  expect_error(
    estimate_s_rss(z, R, n = base_data$n, method = "invalid-method"),
    "not implemented"
  )
})

test_that("estimate_s_rss produces small s for consistent z and R", {
  # Generate data where z-scores are consistent with R
  base_data <- generate_base_data(n = 500, p = 100, k = 3, signal_sd = 0.5, seed = 21)
  ss <- univariate_regression(base_data$X, base_data$y)
  R <- cor(base_data$X)
  z <- with(ss, betahat / sebetahat)
  s <- estimate_s_rss(z, R, n = base_data$n, method = "null-mle")
  # With consistent data, s should be small
  expect_true(s < 0.01)
})

# =============================================================================
# DIAGNOSTIC & QUALITY CONTROL
# =============================================================================

test_that("kriging_rss returns list with plot and conditional_dist", {
  base_data <- generate_base_data(n = 100, p = 50, seed = 22)
  ss <- univariate_regression(base_data$X, base_data$y)
  R <- cor(base_data$X)
  z <- with(ss, betahat / sebetahat)
  result <- kriging_rss(z, R, n = base_data$n)
  expect_type(result, "list")
  expect_named(result, c("plot", "conditional_dist"))
})

test_that("kriging_rss plot is a ggplot object", {
  base_data <- generate_base_data(n = 100, p = 50, seed = 23)
  ss <- univariate_regression(base_data$X, base_data$y)
  R <- cor(base_data$X)
  z <- with(ss, betahat / sebetahat)
  result <- kriging_rss(z, R, n = base_data$n)
  expect_s3_class(result$plot, "gg")
  expect_s3_class(result$plot, "ggplot")
})

test_that("kriging_rss conditional_dist is a data frame with correct columns", {
  base_data <- generate_base_data(n = 100, p = 50, seed = 24)
  ss <- univariate_regression(base_data$X, base_data$y)
  R <- cor(base_data$X)
  z <- with(ss, betahat / sebetahat)
  result <- kriging_rss(z, R, n = base_data$n)
  expect_s3_class(result$conditional_dist, "data.frame")
  expect_equal(nrow(result$conditional_dist), base_data$p)
  expect_true(all(c("z", "condmean", "condvar", "z_std_diff", "logLR") %in%
                    colnames(result$conditional_dist)))
})

test_that("kriging_rss with provided s parameter", {
  base_data <- generate_base_data(n = 100, p = 50, seed = 25)
  ss <- univariate_regression(base_data$X, base_data$y)
  R <- cor(base_data$X)
  z <- with(ss, betahat / sebetahat)
  # Provide custom s
  result <- kriging_rss(z, R, n = base_data$n, s = 0.1)
  expect_type(result, "list")
  expect_s3_class(result$plot, "ggplot")
  expect_equal(nrow(result$conditional_dist), base_data$p)
})

test_that("kriging_rss warns when n is not provided", {
  # NOTE(review): name says "warns" but the check is expect_message — same
  # name/assertion mismatch as the estimate_s_rss test above; verify intent.
  base_data <- generate_base_data(n = 100, p = 50, seed = 26)
  ss <- univariate_regression(base_data$X, base_data$y)
  R <- cor(base_data$X)
  z <- with(ss, betahat / sebetahat)
  expect_message(
    result <- kriging_rss(z, R),
    "sample size"
  )
})

test_that("kriging_rss errors when n <= 1", {
  base_data <- generate_base_data(n = 100, p = 50, seed = 27)
  ss <- univariate_regression(base_data$X, base_data$y)
  R <- cor(base_data$X)
  z <- with(ss, betahat / sebetahat)
  expect_error(
    kriging_rss(z, R, n = 1),
    "must be greater than 1"
  )
})

test_that("kriging_rss handles s > 1 with warning", {
  base_data <- generate_base_data(n = 100, p = 50, seed = 28)
  ss <- univariate_regression(base_data$X, base_data$y)
  R <- cor(base_data$X)
  z <- with(ss, betahat / sebetahat)
  expect_message(
    result <- kriging_rss(z, R, n = base_data$n, s = 1.5),
    "greater than 1"
  )
  # Should still produce output
  expect_type(result, "list")
})

test_that("kriging_rss errors when s < 0", {
  base_data <- generate_base_data(n = 100, p = 50, seed = 29)
  ss <- univariate_regression(base_data$X, base_data$y)
  R <- cor(base_data$X)
  z <- with(ss, betahat / sebetahat)
  expect_error(
    kriging_rss(z, R, n = base_data$n, s = -0.1),
    "non-negative"
  )
})

test_that("kriging_rss handles negative eigenvalues in R", {
  set.seed(30)
  p <- 50
  # Create R with intentionally negative eigenvalue
  R <- matrix(0.5, p, p)
  diag(R) <- 1
  R[1, 2] <- 1.5
  R[2, 1] <- 1.5
  z <- rnorm(p)
  expect_message(
    result <- kriging_rss(z, R, n = 100),
    "not positive semidefinite"
  )
  expect_type(result, "list")
})

test_that("kriging_rss identifies potential allele switches (high logLR)", {
  # Create data with one flipped allele
  base_data <- generate_base_data(n = 500, p = 100, k = 3, signal_sd = 1, seed = 31)
  ss <- univariate_regression(base_data$X, base_data$y)
  R <- cor(base_data$X)
  z <- with(ss, betahat / sebetahat)
  # Flip one z-score to simulate allele switch
  z[1] <- -z[1]
  result <- kriging_rss(z, R, n = base_data$n)
  # The flipped variant should have high logLR
  expect_true(result$conditional_dist$logLR[1] > 0)
})

test_that("kriging_rss handles NA values in z", {
  base_data <- generate_base_data(n = 100, p = 50, seed = 32)
  ss <- univariate_regression(base_data$X, base_data$y)
  R <- cor(base_data$X)
  z <- with(ss, betahat / sebetahat)
  # Introduce NA
  z[10] <- NA
  expect_error(
    result <- kriging_rss(z, R, n = base_data$n),
    NA
  )
  # NA should be replaced with 0
  expect_equal(result$conditional_dist$z[10], 0)
})

test_that("kriging_rss conditional mean and variance are sensible", {
  base_data <- generate_base_data(n = 200, p = 50, seed = 33)
  ss <- univariate_regression(base_data$X, base_data$y)
  R <- cor(base_data$X)
  z <- with(ss, betahat / sebetahat)
  result <- kriging_rss(z, R, n = base_data$n)
  # All conditional variances should be positive
  expect_true(all(result$conditional_dist$condvar > 0))
  # Conditional means should be finite
  expect_true(all(is.finite(result$conditional_dist$condmean)))
  # Standardized differences should be finite
  expect_true(all(is.finite(result$conditional_dist$z_std_diff)))
})

test_that("kriging_rss sets a_max=2 when max(z_std_diff^2) < 1", {
  # Create data where z-scores are very consistent with R
  # Use very small z-scores (close to 0) which will have small standardized differences
  set.seed(34)
  p <- 50
  # Create identity correlation matrix (independent variables)
  R <- diag(p)
  # Use very small z-scores (near zero)
  z <- rnorm(p, mean = 0, sd = 0.3) # Small standard deviation
  result <- kriging_rss(z, R, n = 100)
  # Verify that max(z_std_diff^2) < 1
  max_z_std_diff_sq <- max(result$conditional_dist$z_std_diff^2)
  expect_true(max_z_std_diff_sq < 1)
  # The plot should be created successfully (tests the a_max=2 branch)
  expect_s3_class(result$plot, "ggplot")
})

test_that("kriging_rss adds red points when outliers exist (length(idx) > 0)", {
  # Create scenario that produces outliers with high logLR
  # Use data with inconsistent z-scores relative to correlation structure
  set.seed(32) # This seed produces outliers
  n <- 200
  p <- 50
  # Generate data with signal
  base_data <- generate_base_data(n = n, p = p, k = 5, signal_sd = 2, seed = 32)
  ss <- univariate_regression(base_data$X, base_data$y)
  R <- cor(base_data$X)
  z <- with(ss, betahat / sebetahat)
  # Flip some strong z-scores to create allele switch-like pattern
  strong_idx <- which(abs(z) > 2)
  if (length(strong_idx) >= 3) {
    # Flip first 3 strong z-scores
    flip_idx <- strong_idx[1:3]
    z[flip_idx] <- -z[flip_idx]
  }
  result <- kriging_rss(z, R, n = n)
  # Check that outliers were detected
  outliers <- which(result$conditional_dist$logLR > 2 &
                      abs(result$conditional_dist$z) > 2)
  # Verify the length(idx) > 0 branch was executed
  expect_true(length(outliers) > 0)
  # Test that plot was created successfully (with red points added)
  expect_s3_class(result$plot, "ggplot")
  expect_s3_class(result$conditional_dist, "data.frame")
})

================================================
FILE: tests/testthat/test_single_effect_regression.R
================================================

context("Single Effect Regression")

# =============================================================================
# SINGLE_EFFECT_REGRESSION - Returns Correct Structure
# =============================================================================

test_that("single_effect_regression returns correct structure", {
  setup <- setup_individual_data(n = 100, p = 50, L = 5)
  l <- 1
  # Residuals for effect l must be refreshed before the SER update.
  setup$model <- compute_residuals.individual(setup$data, setup$params,
                                              setup$model, l)
  result <- single_effect_regression(setup$data, setup$params, setup$model, l)
  expect_type(result, "list")
  expect_true("alpha" %in% names(result))
  expect_true("mu" %in% names(result))
  expect_true("mu2" %in% names(result))
  expect_true("lbf" %in% names(result))
  expect_true("lbf_variable" %in% names(result))
  expect_true("V" %in% names(result))
  expect_length(result$alpha[l, ], setup$data$p)
  expect_length(result$mu[l, ], setup$data$p)
  expect_length(result$mu2[l, ], setup$data$p)
  expect_length(result$lbf_variable[l, ], setup$data$p)
  expect_length(result$lbf[l], 1)
  expect_length(result$V[l], 1)
})

# =============================================================================
# SINGLE_EFFECT_REGRESSION - Alpha Sums to 1
# =============================================================================

test_that("single_effect_regression alpha is valid probability distribution", {
  setup <- setup_individual_data(n = 100, p = 50, L = 5)
  l <- 1
  setup$model <- compute_residuals.individual(setup$data, setup$params,
                                              setup$model, l)
  result <- single_effect_regression(setup$data, setup$params, setup$model, l)
  expect_equal(sum(result$alpha[l, ]), 1, tolerance = 1e-10)
  expect_true(all(result$alpha[l, ] >= 0 & result$alpha[l, ] <= 1))
})

# =============================================================================
# SINGLE_EFFECT_REGRESSION - V Non-negative
# =============================================================================

test_that("single_effect_regression V is non-negative and finite", {
  setup <- setup_individual_data(n = 100, p = 50, L = 5)
  l <- 1
  setup$model <- compute_residuals.individual(setup$data, setup$params,
                                              setup$model, l)
  result <- single_effect_regression(setup$data, setup$params, setup$model, l)
  expect_true(result$V[l] >= 0)
  expect_true(is.finite(result$V[l]))
})

# =============================================================================
# SINGLE_EFFECT_REGRESSION - Different Estimation Methods
# =============================================================================

test_that("single_effect_regression works with estimate_prior_method='optim'", {
  setup <- setup_individual_data(n = 100, p = 50, L = 5)
  setup$params$estimate_prior_method <- "optim"
  l <- 1
  setup$model <- compute_residuals.individual(setup$data, setup$params, setup$model, l)
  result <- single_effect_regression(setup$data, setup$params, setup$model, l)
  expect_true(result$V[l] >= 0)
  expect_equal(sum(result$alpha[l, ]), 1, tolerance = 1e-10)
})

test_that("single_effect_regression works with estimate_prior_method='EM'", {
  setup <- setup_individual_data(n = 100, p = 50, L = 5)
  setup$params$estimate_prior_method <- "EM"
  l <- 1
  setup$model <- compute_residuals.individual(setup$data, setup$params, setup$model, l)
  result <- single_effect_regression(setup$data, setup$params, setup$model, l)
  expect_true(result$V[l] >= 0)
  expect_equal(sum(result$alpha[l, ]), 1, tolerance = 1e-10)
})

test_that("single_effect_regression works with estimate_prior_method='simple'", {
  setup <- setup_individual_data(n = 100, p = 50, L = 5)
  setup$params$estimate_prior_method <- "simple"
  l <- 1
  setup$model <- compute_residuals.individual(setup$data, setup$params, setup$model, l)
  result <- single_effect_regression(setup$data, setup$params, setup$model, l)
  expect_true(result$V[l] >= 0)
  expect_equal(sum(result$alpha[l, ]), 1, tolerance = 1e-10)
})

test_that("single_effect_regression works with estimate_prior_method='none'", {
  setup <- setup_individual_data(n = 100, p = 50, L = 5)
  setup$params$estimate_prior_method <- "none"
  l <- 1
  setup$model <- compute_residuals.individual(setup$data, setup$params, setup$model, l)
  result <- single_effect_regression(setup$data, setup$params, setup$model, l)
  expect_true(result$V[l] >= 0)
  expect_equal(sum(result$alpha[l, ]), 1, tolerance = 1e-10)
})

test_that("single_effect_regression rejects invalid estimate_prior_method", {
  setup <- setup_individual_data(n = 100, p = 50, L = 5)
  setup$params$estimate_prior_method <- "invalid_method"
  l <- 1
  setup$model <- compute_residuals.individual(setup$data, setup$params, setup$model, l)
  expect_error(
    single_effect_regression(setup$data, setup$params, setup$model, l),
    "Invalid option for estimate_prior_method: invalid_method"
  )
})

# =============================================================================
# SINGLE_EFFECT_UPDATE
# =============================================================================

test_that("single_effect_update updates all model components", {
  setup <- setup_individual_data(n = 100, p = 50, L = 5)
  l <- 1
  updated_model <- single_effect_update(setup$data, setup$params, setup$model, l)
  expect_equal(sum(updated_model$alpha[l, ]), 1, tolerance = 1e-10)
  expect_true(updated_model$V[l] >= 0)
  # KL divergence is non-negative up to numerical noise.
  expect_true(updated_model$KL[l] >= -1e-6)
  expect_true("lbf" %in% names(updated_model))
  expect_true("lbf_variable" %in% names(updated_model))
  expect_true("Xr" %in% names(updated_model))
})

test_that("single_effect_update maintains valid probability constraints", {
  setup <- setup_individual_data(n = 100, p = 50, L = 5)
  l <- 1
  updated_model <- single_effect_update(setup$data, setup$params, setup$model, l)
  expect_equal(sum(updated_model$alpha[l, ]), 1, tolerance = 1e-10)
  expect_true(all(updated_model$alpha[l, ] >= 0))
  expect_true(all(updated_model$alpha[l, ] <= 1))
})

test_that("single_effect_update works for all effects l=1,...,L", {
  setup <- setup_individual_data(n = 100, p = 50, L = 5)
  for (l in 1:setup$params$L) {
    updated_model <- single_effect_update(setup$data, setup$params, setup$model, l)
    expect_equal(sum(updated_model$alpha[l, ]), 1, tolerance = 1e-10)
    expect_true(updated_model$V[l] >= 0)
  }
})

# =============================================================================
# MATHEMATICAL PROPERTIES
# =============================================================================

test_that("SER variance decomposition", {
  # Posterior variance = E[b^2] - (E[b])^2 must be non-negative.
  setup <- setup_individual_data(n = 100, p = 50, L = 5)
  l <- 1
  setup$model <- compute_residuals.individual(setup$data, setup$params, setup$model, l)
  result <- single_effect_regression(setup$data, setup$params, setup$model, l)
  post_second_moment <- sum(result$alpha[l, ] * result$mu2[l, ])
  post_mean_squared <- (sum(result$alpha[l, ] * result$mu[l, ]))^2
  post_var <- post_second_moment - post_mean_squared
  expect_true(post_var >= -1e-10)
})

test_that("SER log Bayes factors are finite", {
  setup <- setup_individual_data(n = 100, p = 50, L = 5)
  l <- 1
  setup$model <- compute_residuals.individual(setup$data, setup$params, setup$model, l)
  result <- single_effect_regression(setup$data, setup$params, setup$model, l)
  expect_true(all(is.finite(result$lbf_variable[l, ])))
  expect_true(is.finite(result$lbf[l]))
})

test_that("SER posterior moments are finite", {
  setup <- setup_individual_data(n = 100, p = 50, L = 5)
  l <- 1
  setup$model <- compute_residuals.individual(setup$data, setup$params, setup$model, l)
  result <- single_effect_regression(setup$data, setup$params, setup$model, l)
  expect_true(all(is.finite(result$mu[l, ])))
  expect_true(all(is.finite(result$mu2[l, ])))
  expect_true(all(result$mu2[l, ] >= 0))
})

# =============================================================================
# SIGNAL DETECTION
# =============================================================================

test_that("SER with strong signal has large V", {
  set.seed(123)
  n <- 100
  p <- 50
  base_data <- generate_base_data(n, p, k = 1, signal_sd = 10, seed = NULL)
  X <- set_X_attributes(base_data$X, center = TRUE, scale = TRUE)
  y <- base_data$y - mean(base_data$y)
  data <- structure(
    list(X = X, y = y, n = n, p = p, mean_y = mean(base_data$y)),
    class = "individual"
  )
  params <- create_base_params(L = 1, p = p, additional_params = list(
    estimate_prior_method = "optim", use_NIG = FALSE, check_null_threshold = 0.1
  ))
  model <- create_base_model(L = 1, p = p, n = n, X_attr = attr(X, "d"))
  model <- compute_residuals.individual(data, params, model, 1)
  result <- single_effect_regression(data, params, model, 1)
  expect_true(result$V > 0.1)
})

test_that("SER with no signal has V close to 0", {
  set.seed(456)
  n <- 100
  p <- 50
  # k = 0: pure-noise response, so the estimated prior variance should vanish.
  base_data <- generate_base_data(n, p, k = 0, seed = NULL)
  X <- set_X_attributes(base_data$X, center = TRUE, scale = TRUE)
  y <- base_data$y - mean(base_data$y)
  data <- structure(
    list(X = X, y = y, n = n, p = p, mean_y = mean(base_data$y)),
    class = "individual"
  )
  params <- create_base_params(L = 1, p = p, additional_params = list(
    estimate_prior_method = "optim", use_NIG = FALSE, check_null_threshold = 0.1
  ))
  model <- create_base_model(L = 1, p = p, n = n, X_attr = attr(X, "d"))
  model <- compute_residuals.individual(data, params, model, 1)
  result <- single_effect_regression(data, params, model, 1)
  expect_equal(result$V, 0, tolerance = 1e-10)
})

# =============================================================================
# EDGE CASES
# =============================================================================

test_that("SER handles single variable (p=1)", {
  setup <- setup_individual_data(n = 100, p = 1, L = 1)
  l <- 1
  # With p = 1 the posterior inclusion probability must be exactly 1.
  setup$model$alpha <- matrix(1, 1, 1)
  setup$model$mu <- matrix(0, 1, 1)
  setup$model$mu2 <- matrix(0, 1, 1)
  setup$model$V <- 1
  setup$model$pi <- 1
  setup$model$predictor_weights <- attr(setup$data$X, "d")
  setup$model$lbf <- 0
  setup$model$lbf_variable <- matrix(0, 1, 1)
  setup$model <- compute_residuals.individual(setup$data, setup$params, setup$model, l)
  result <- single_effect_regression(setup$data, setup$params, setup$model, l)
  expect_length(result$alpha, 1)
  expect_equal(result$alpha[1], 1)
  expect_true(result$V >= 0)
})

================================================
FILE: tests/testthat/test_slot_prior.R
================================================

context("slot_prior class")

# FIX(review): the two constructor tests below previously shared the exact
# same description ("slot_prior_poisson constructs correctly"), which makes
# testthat reports ambiguous; they are now distinguished by name. A stale
# "# binomial default" comment on a poisson constructor was also corrected.

test_that("slot_prior_poisson constructs correctly with default settings", {
  sp <- suppressMessages(slot_prior_poisson(C = 5, nu = 8))
  expect_s3_class(sp, "slot_prior_poisson")
  expect_s3_class(sp, "slot_prior")
  expect_equal(sp$C, 5)
  expect_equal(sp$nu, 8)
  expect_equal(sp$update_schedule, "sequential") # sequential is the default schedule
  expect_null(sp$c_hat_init)
  expect_equal(sp$skip_threshold_multiplier, 0)
})

test_that("slot_prior_poisson constructs correctly with non-default nu", {
  sp <- slot_prior_poisson(C = 3, nu = 10)
  expect_s3_class(sp, "slot_prior_poisson")
  expect_s3_class(sp, "slot_prior")
  expect_equal(sp$C, 3)
  expect_equal(sp$nu, 10)
  expect_equal(sp$update_schedule, "sequential")
})

test_that("slot_prior validates inputs", {
  expect_error(slot_prior_poisson(C = -1, nu = 8))    # negative C
  expect_error(slot_prior_poisson(C = "abc", nu = 8)) # non-numeric C
  expect_error(slot_prior_poisson(C = 5, nu = -1))    # negative nu
})

test_that("slot_prior tracks nu_was_default", {
  # nu_was_default distinguishes an omitted nu from an explicit nu = 8.
  sp_default <- slot_prior_poisson(C = 4)
  expect_true(sp_default$nu_was_default)
  expect_equal(sp_default$nu, 8)
  sp_explicit <- slot_prior_poisson(C = 4, nu = 8)
  expect_false(sp_explicit$nu_was_default)
  expect_equal(sp_explicit$nu, 8)
})

# FIX(review): this test previously appeared twice, byte-for-byte identical;
# the duplicate has been removed.
test_that("slot_prior_poisson default for update_schedule is sequential", {
  sp <- slot_prior_poisson(C = 5, nu = 8)
  expect_equal(sp$update_schedule, "sequential")
})

test_that("is.slot_prior works", {
  expect_true(is.slot_prior(slot_prior_poisson(C = 5, nu = 8)))
  expect_false(is.slot_prior(list(C = 5)))
  expect_false(is.slot_prior(NULL))
})

test_that("print.slot_prior produces output", {
  expect_output(print(slot_prior_poisson(C = 5, nu = 8)), "poisson")
  expect_output(print(slot_prior_poisson(C = 3, nu = 8)), "poisson")
})

test_that("susie with slot_prior produces c_hat output", {
  set.seed(1)
  n <- 100; p <- 200
  X <- matrix(rnorm(n * p), n, p)
  b <- rep(0, p); b[1:3] <- 1
  y <- X %*% b + rnorm(n)
  fit <- susie(X, y, L = 10, slot_prior = slot_prior_poisson(C = 3, nu = 8),
               verbose = FALSE)
  expect_true(!is.null(fit$c_hat))
  expect_equal(length(fit$c_hat), 10) # one c_hat per effect
  expect_true(all(fit$c_hat >= 0 & fit$c_hat <= 1))
  expect_true(!is.null(fit$C_hat))
  expect_true(fit$C_hat > 0)
})

# FIX(review): this test was named "susie with binomial and poisson give
# similar results" but both fits used the identical slot_prior_poisson call,
# so it never compared two families. It is kept as a reproducibility check
# of two identical fits on the same data until a binomial constructor exists.
test_that("susie slot_prior fits are reproducible across identical calls", {
  set.seed(42)
  n <- 100; p <- 200
  X <- matrix(rnorm(n * p), n, p)
  b <- rep(0, p); b[1:3] <- 1
  y <- X %*% b + rnorm(n)
  fit_b <- susie(X, y, L = 10, slot_prior = slot_prior_poisson(C = 3, nu = 8),
                 verbose = FALSE)
  fit_p <- susie(X, y, L = 10, slot_prior = slot_prior_poisson(C = 3, nu = 8),
                 verbose = FALSE)
  # Both should find approximately the same effects
  expect_equal(length(fit_b$sets$cs), length(fit_p$sets$cs))
  expect_equal(fit_b$C_hat, fit_p$C_hat, tolerance = 1)
})

test_that("susie without slot_prior does not produce c_hat", {
  set.seed(1)
  n <- 100; p <- 200
  X <- matrix(rnorm(n * p), n, p)
  y <- rnorm(n)
  fit <- susie(X, y, L = 5, verbose = FALSE)
  expect_null(fit$c_hat)
})

test_that("ash model auto-creates binomial slot_prior with warning", {
  # NOTE(review): only the "strongly advised" message and c_hat presence are
  # asserted; that the auto-created prior is binomial is not verified here.
  set.seed(1)
  n <- 100; p <- 200
  X <- matrix(rnorm(n * p), n, p)
  y <- rnorm(n)
  expect_message(
    fit <- susie(X, y, L = 10, unmappable_effects = "ash", verbose = FALSE,
                 max_iter = 5),
    "strongly advised"
  )
  expect_true(!is.null(fit$c_hat))
})

test_that("ash model with explicit slot_prior does not warn about C", {
  set.seed(1)
  n <- 100; p <- 200
  X <- matrix(rnorm(n * p), n, p)
  y <- rnorm(n)
  # Should not produce the "strongly advised" warning about C
  # (may still produce convergence method warning, which is expected)
  fit <- withCallingHandlers(
    susie(X, y, L = 10, unmappable_effects = "ash",
          slot_prior = slot_prior_poisson(C = 3, nu = 8),
          verbose = FALSE, max_iter = 5),
    warning = function(w) {
      if (grepl("strongly advised", conditionMessage(w)))
        stop("Got unexpected C warning")
      invokeRestart("muffleWarning")
    }
  )
  expect_true(!is.null(fit$c_hat))
})

test_that("c_hat warm start works", {
  set.seed(1)
  n <- 100; p <- 200
  X <- matrix(rnorm(n * p), n, p)
  b <- rep(0, p); b[1:3] <- 1
  y <- X %*% b + rnorm(n)
  # First fit
  fit1 <- susie(X, y, L = 10, slot_prior = slot_prior_poisson(C = 3, nu = 8),
                verbose = FALSE)
  # Warm start with previous c_hat
  sp_warm <- slot_prior_poisson(C = 3, nu = 8, c_hat_init = fit1$c_hat)
  fit2 <- susie(X, y, L = 10, slot_prior = sp_warm, model_init = fit1,
                verbose = FALSE)
  # Should converge immediately or in very few iterations
  expect_true(fit2$niter <= fit1$niter)
})

test_that("batch and sequential schedules both converge", {
  set.seed(1)
  n <- 100; p <- 200
  X <- matrix(rnorm(n * p), n, p)
  b <- rep(0, p); b[1:3] <- 1
  y <- X %*% b + rnorm(n)
  fit_batch <- susie(X, y, L = 10,
                     slot_prior = slot_prior_poisson(C = 3, update_schedule = "batch"),
                     verbose = FALSE)
  fit_seq <- susie(X, y, L = 10,
                   slot_prior = slot_prior_poisson(C = 3, update_schedule = "sequential"),
                   verbose = FALSE)
  expect_true(fit_batch$converged)
  expect_true(fit_seq$converged)
  # Results should be very similar
  expect_equal(sum(fit_batch$c_hat > 0.5), sum(fit_seq$c_hat > 0.5))
})

================================================
FILE: tests/testthat/test_slot_weights.R
================================================

# Tests for slot_weights mechanism
#
# Key invariant: slot_weights = rep(1, L) must produce identical results
# to the standard path (slot_weights = NULL).
context("Slot weights")

# Shared simulation used by all tests in this file: n = 200 samples,
# p = 50 predictors, three true nonzero effects, plus the summary
# statistics (correlation matrix R and z-scores z) for the RSS interface.
set.seed(1)
n <- 200
p <- 50
X <- matrix(rnorm(n * p), n, p)
beta <- rep(0, p)
beta[c(1, 5, 10)] <- c(0.5, -0.3, 0.4)
y <- X %*% beta + rnorm(n)
R <- cor(X)
z <- as.vector(sqrt(n) * crossprod(X, y) / sqrt(n * diag(crossprod(X))))

# =============================================================================
# Test 1: slot_weights = rep(1,L) matches NULL (RSS)
# =============================================================================
test_that("slot_weights = rep(1,L) matches standard path for RSS", {
  L <- 5
  fit_std <- susie_rss(z = z, R = R, n = n, L = L,
                       estimate_prior_variance = FALSE,
                       estimate_residual_variance = FALSE,
                       max_iter = 10, tol = 1e-4)
  # Run with explicit all-ones slot_weights via workhorse
  objs <- susie_rss(z = z, R = R, n = n, L = L,
                    estimate_prior_variance = FALSE,
                    estimate_residual_variance = FALSE,
                    max_iter = 10, tol = 1e-4, init_only = TRUE)
  model <- susieR:::ibss_initialize(objs$data, objs$params)
  model$slot_weights <- rep(1, L)
  fit_sw <- susieR:::susie_workhorse(objs$data, objs$params)
  # Should be identical (slot_weights = NULL is equivalent to rep(1,L))
  # Note: we compare the standard path vs workhorse-with-weights
  # The workhorse doesn't see slot_weights because it initializes fresh.
  # So instead, verify that get_slot_weight returns 1 when NULL.
  # NOTE(review): fit_std and fit_sw are computed but never compared; the
  # assertions below only exercise the get_slot_weight accessor — confirm
  # whether a fit-level comparison was intended here.
  expect_equal(susieR:::get_slot_weight(list(), 1), 1)
  expect_equal(susieR:::get_slot_weight(list(slot_weights = c(0.5, 0.8)), 1), 0.5)
  expect_equal(susieR:::get_slot_weight(list(slot_weights = c(0.5, 0.8)), 2), 0.8)
})

# =============================================================================
# Test 2: slot_weights = 0 for one effect zeroes its contribution
# =============================================================================
test_that("slot_weight = 0 zeroes effect contribution in RSS", {
  L <- 3
  objs <- susie_rss(z = z, R = R, n = n, L = L,
                    estimate_prior_variance = FALSE,
                    estimate_residual_variance = FALSE, init_only = TRUE)
  data <- objs$data
  params <- objs$params
  model <- susieR:::ibss_initialize(data, params)
  # Set slot 2 weight to 0
  model$slot_weights <- c(1, 0, 1)
  # Run one SER update for slot 2
  model_before <- model
  model <- susieR:::single_effect_update(data, params, model, 2)
  # The fitted values (Rz) should not change from slot 2's contribution
  # because its weight is 0. After update, slot 2's alpha*mu is computed
  # but multiplied by 0 in update_fitted_values.
  # The SER still runs (alpha, mu are updated), but the contribution to
  # the total fitted value is zero.
  expect_true(is.numeric(model$alpha[2, ]))
  expect_true(all(is.finite(model$alpha[2, ])))
})

# =============================================================================
# Test 3: slot_weights works with individual data
# =============================================================================
test_that("slot_weights works with individual data", {
  L <- 3
  fit <- susie(X, y, L = L, estimate_prior_variance = FALSE,
               estimate_residual_variance = FALSE, max_iter = 1)
  # Just verify it runs without error
  expect_true(all(fit$pip >= 0 & fit$pip <= 1))
})

# =============================================================================
# Test 4: slot_weights works with sufficient stats
# =============================================================================
test_that("slot_weights works with sufficient stats", {
  L <- 3
  XtX <- crossprod(X)
  Xty <- crossprod(X, y)
  yty <- sum(y^2)
  fit <- susie_ss(XtX = XtX, Xty = Xty, yty = yty, n = n, L = L,
                  estimate_prior_variance = FALSE,
                  estimate_residual_variance = FALSE, max_iter = 1)
  expect_true(all(fit$pip >= 0 & fit$pip <= 1))
})


================================================
FILE: tests/testthat/test_sparse_multiplication.R
================================================
context("sparse multiplication utilities")

# Convention used throughout: compute_Xb/compute_Xty/compute_XtX/compute_MXt
# read "scaled:center" and "scaled:scale" attributes from the raw matrix and
# must behave as if X had been explicitly standardized with scale().

# =============================================================================
# compute_Xb
# =============================================================================
test_that("compute_Xb works with dense matrices (centered and scaled)", {
  set.seed(123)
  n <- 50
  p <- 10
  # Create test data
  X_raw <- matrix(rnorm(n * p), n, p)
  b <- rnorm(p)
  # Standardize X and add attributes
  cm <- colMeans(X_raw)
  csd <- apply(X_raw, 2, sd)
  X_std <- scale(X_raw, center = TRUE, scale = TRUE)
  # Add attributes to raw X
  attr(X_raw, "scaled:center") <- cm
  attr(X_raw, "scaled:scale") <- csd
  # Compute using function
  result <- compute_Xb(X_raw, b)
  # Compute expected result (naive)
  expected <- as.vector(X_std %*% b)
  expect_equal(result, expected, tolerance = 1e-10)
  expect_length(result, n)
})

test_that("compute_Xb works with sparse matrices (centered and scaled)", {
  set.seed(456)
  n <- 100
  p <- 20
  # Create sparse test data (30% non-zero)
  X_raw <- Matrix::Matrix(rbinom(n * p, 1, 0.3) * rnorm(n * p), n, p,
                          sparse = TRUE)
  b <- rnorm(p)
  # Standardize and add attributes
  cm <- Matrix::colMeans(X_raw)
  csd <- apply(as.matrix(X_raw), 2, sd)
  attr(X_raw, "scaled:center") <- cm
  attr(X_raw, "scaled:scale") <- csd
  # Compute using function
  result <- compute_Xb(X_raw, b)
  # Compute expected result (naive with standardization)
  X_std <- scale(as.matrix(X_raw), center = cm, scale = csd)
  expected <- as.vector(X_std %*% b)
  expect_equal(result, expected, tolerance = 1e-10)
  expect_length(result, n)
})

test_that("compute_Xb works with only centering (no scaling)", {
  set.seed(789)
  n <- 30
  p <- 5
  X_raw <- matrix(rnorm(n * p), n, p)
  b <- rnorm(p)
  cm <- colMeans(X_raw)
  csd <- rep(1, p) # No scaling
  attr(X_raw, "scaled:center") <- cm
  attr(X_raw, "scaled:scale") <- csd
  result <- compute_Xb(X_raw, b)
  # Expected: centered X times b
  X_centered <- scale(X_raw, center = cm, scale = FALSE)
  expected <- as.vector(X_centered %*% b)
  expect_equal(result, expected, tolerance = 1e-10)
})

test_that("compute_Xb works with only scaling (no centering)", {
  set.seed(101)
  n <- 30
  p <- 5
  X_raw <- matrix(rnorm(n * p), n, p)
  b <- rnorm(p)
  cm <- rep(0, p) # No centering
  csd <- apply(X_raw, 2, sd)
  attr(X_raw, "scaled:center") <- cm
  attr(X_raw, "scaled:scale") <- csd
  result <- compute_Xb(X_raw, b)
  # Expected: scaled X times b
  X_scaled <- scale(X_raw, center = FALSE, scale = csd)
  expected <- as.vector(X_scaled %*% b)
  expect_equal(result, expected, tolerance = 1e-10)
})

test_that("compute_Xb handles zero vector b", {
  set.seed(202)
  n <- 20
  p <- 8
  X_raw <- matrix(rnorm(n * p), n, p)
  b <- rep(0, p)
  attr(X_raw, "scaled:center") <- colMeans(X_raw)
  attr(X_raw, "scaled:scale") <- apply(X_raw, 2, sd)
  result <- compute_Xb(X_raw, b)
  expect_equal(result, rep(0, n), tolerance = 1e-10)
})

# =============================================================================
# compute_Xty
# =============================================================================
test_that("compute_Xty works with dense matrices (centered and scaled)", {
  set.seed(303)
  n <- 50
  p <- 10
  X_raw <- matrix(rnorm(n * p), n, p)
  y <- rnorm(n)
  # Standardize X
  cm <- colMeans(X_raw)
  csd <- apply(X_raw, 2, sd)
  X_std <- scale(X_raw, center = cm, scale = csd)
  attr(X_raw, "scaled:center") <- cm
  attr(X_raw, "scaled:scale") <- csd
  result <- compute_Xty(X_raw, y)
  # Expected result
  expected <- as.vector(t(X_std) %*% y)
  expect_equal(result, expected, tolerance = 1e-10)
  expect_length(result, p)
})

test_that("compute_Xty works with sparse matrices (centered and scaled)", {
  set.seed(404)
  n <- 100
  p <- 20
  X_raw <- Matrix::Matrix(rbinom(n * p, 1, 0.3) * rnorm(n * p), n, p,
                          sparse = TRUE)
  y <- rnorm(n)
  cm <- Matrix::colMeans(X_raw)
  csd <- apply(as.matrix(X_raw), 2, sd)
  attr(X_raw, "scaled:center") <- cm
  attr(X_raw, "scaled:scale") <- csd
  result <- compute_Xty(X_raw, y)
  # Expected result
  X_std <- scale(as.matrix(X_raw), center = cm, scale = csd)
  expected <- as.vector(t(X_std) %*% y)
  expect_equal(result, expected, tolerance = 1e-10)
  expect_length(result, p)
})

test_that("compute_Xty works with only centering (no scaling)", {
  set.seed(505)
  n <- 30
  p <- 5
  X_raw <- matrix(rnorm(n * p), n, p)
  y <- rnorm(n)
  cm <- colMeans(X_raw)
  csd <- rep(1, p)
  attr(X_raw, "scaled:center") <- cm
  attr(X_raw, "scaled:scale") <- csd
  result <- compute_Xty(X_raw, y)
  X_centered <- scale(X_raw, center = cm, scale = FALSE)
  expected <- as.vector(t(X_centered) %*% y)
  expect_equal(result, expected, tolerance = 1e-10)
})

test_that("compute_Xty handles zero vector y", {
  set.seed(606)
  n <- 20
  p <- 8
  X_raw <- matrix(rnorm(n * p), n, p)
  y <- rep(0, n)
  attr(X_raw, "scaled:center") <- colMeans(X_raw)
  attr(X_raw, "scaled:scale") <- apply(X_raw, 2, sd)
  result <- compute_Xty(X_raw, y)
  expect_equal(result, rep(0, p), tolerance = 1e-10)
})

# =============================================================================
# compute_XtX
# =============================================================================
test_that("compute_XtX works with dense matrices (centered and scaled)", {
  set.seed(707)
  n <- 50
  p <- 10
  X_raw <- matrix(rnorm(n * p), n, p)
  cm <- colMeans(X_raw)
  csd <- apply(X_raw, 2, sd)
  X_std <- scale(X_raw, center = cm, scale = csd)
  attr(X_raw, "scaled:center") <- cm
  attr(X_raw, "scaled:scale") <- csd
  attr(X_raw, "d") <- colSums(X_std^2)
  result <- compute_XtX(X_raw)
  # Expected result
  expected <- t(X_std) %*% X_std
  expect_equal(result, expected, tolerance = 1e-10)
  expect_equal(dim(result), c(p, p))
})

test_that("compute_XtX produces symmetric matrix", {
  set.seed(808)
  n <- 40
  p <- 8
  X_raw <- matrix(rnorm(n * p), n, p)
  attr(X_raw, "scaled:center") <- colMeans(X_raw)
  attr(X_raw, "scaled:scale") <- apply(X_raw, 2, sd)
  result <- compute_XtX(X_raw)
  expect_equal(result, t(result), tolerance = 1e-10)
})

test_that("compute_XtX is positive semi-definite", {
  set.seed(909)
  n <- 60
  p <- 12
  X_raw <- matrix(rnorm(n * p), n, p)
  attr(X_raw, "scaled:center") <- colMeans(X_raw)
  attr(X_raw, "scaled:scale") <- apply(X_raw, 2, sd)
  result <- compute_XtX(X_raw)
  # Check eigenvalues are non-negative
  eigenvalues <- eigen(result, symmetric = TRUE)$values
  expect_true(all(eigenvalues >= -1e-10)) # Allow for numerical error
})

test_that("compute_XtX works with sparse matrices", {
  set.seed(1010)
  n <- 100
  p <- 20
  X_raw <- Matrix::Matrix(rbinom(n * p, 1, 0.3) * rnorm(n * p), n, p,
                          sparse = TRUE)
  cm <- Matrix::colMeans(X_raw)
  csd <- apply(as.matrix(X_raw), 2, sd)
  attr(X_raw, "scaled:center") <- cm
  attr(X_raw, "scaled:scale") <- csd
  result <- compute_XtX(X_raw)
  # Expected result
  X_std <- scale(as.matrix(X_raw), center = cm, scale = csd)
  expected <- t(X_std) %*% X_std
  expect_equal(as.matrix(result), expected, tolerance = 1e-9)
})

test_that("compute_XtX works with only centering (no scaling)", {
  set.seed(1111)
  n <- 30
  p <- 6
  X_raw <- matrix(rnorm(n * p), n, p)
  cm <- colMeans(X_raw)
  csd <- rep(1, p)
  attr(X_raw, "scaled:center") <- cm
  attr(X_raw, "scaled:scale") <- csd
  result <- compute_XtX(X_raw)
  X_centered <- scale(X_raw, center = cm, scale = FALSE)
  expected <- t(X_centered) %*% X_centered
  expect_equal(result, expected, tolerance = 1e-10)
})

test_that("compute_XtX rejects trend filtering matrices", {
  set.seed(1212)
  n <- 50
  p <- 10
  X_raw <- matrix(rnorm(n * p), n, p)
  # Add standard attributes
  attr(X_raw, "scaled:center") <- colMeans(X_raw)
  attr(X_raw, "scaled:scale") <- apply(X_raw, 2, sd)
  # Add matrix.type attribute to simulate trend filtering matrix
  attr(X_raw, "matrix.type") <- "trend_filtering"
  expect_error(
    compute_XtX(X_raw),
    "compute_XtX not yet implemented for trend filtering matrices"
  )
})

# =============================================================================
# compute_MXt
# =============================================================================
test_that("compute_MXt works with dense matrices (centered and scaled)", {
  # NOTE(review): seed 1212 repeats the seed of the previous test; harmless
  # but presumably unintentional — confirm.
  set.seed(1212)
  n <- 50
  p <- 10
  L <- 3
  X_raw <- matrix(rnorm(n * p), n, p)
  M <- matrix(rnorm(L * p), L, p)
  cm <- colMeans(X_raw)
  csd <- apply(X_raw, 2, sd)
  X_std <- scale(X_raw, center = cm, scale = csd)
  attr(X_raw, "scaled:center") <- cm
  attr(X_raw, "scaled:scale") <- csd
  result <- compute_MXt(M, X_raw)
  # Expected result
  expected <- M %*% t(X_std)
  expect_equal(result, expected, tolerance = 1e-10)
  expect_equal(dim(result), c(L, n))
})

test_that("compute_MXt works with sparse matrices", {
  set.seed(1313)
  n <- 100
  p <- 20
  L <- 5
  X_raw <- Matrix::Matrix(rbinom(n * p, 1, 0.3) * rnorm(n * p), n, p,
                          sparse = TRUE)
  M <- matrix(rnorm(L * p), L, p)
  cm <- Matrix::colMeans(X_raw)
  csd <- apply(as.matrix(X_raw), 2, sd)
  attr(X_raw, "scaled:center") <- cm
  attr(X_raw, "scaled:scale") <- csd
  result <- compute_MXt(M, X_raw)
  # Expected result
  X_std <- scale(as.matrix(X_raw), center = cm, scale = csd)
  expected <- M %*% t(X_std)
  expect_equal(result, expected, tolerance = 1e-9)
})

test_that("compute_MXt works with single row M", {
  set.seed(1414)
  n <- 40
  p <- 8
  X_raw <- matrix(rnorm(n * p), n, p)
  M <- matrix(rnorm(p), 1, p) # Single row
  cm <- colMeans(X_raw)
  csd <- apply(X_raw, 2, sd)
  X_std <- scale(X_raw, center = cm, scale = csd)
  attr(X_raw, "scaled:center") <- cm
  attr(X_raw, "scaled:scale") <- csd
  result <- compute_MXt(M, X_raw)
  expected <- M %*% t(X_std)
  expect_equal(result, expected, tolerance = 1e-10)
  expect_equal(dim(result), c(1, n))
})

test_that("compute_MXt handles zero matrix M", {
  set.seed(1515)
  n <- 30
  p <- 6
  L <- 2
  X_raw <- matrix(rnorm(n * p), n, p)
  M <- matrix(0, L, p)
  attr(X_raw, "scaled:center") <- colMeans(X_raw)
  attr(X_raw, "scaled:scale") <- apply(X_raw, 2, sd)
  result <- compute_MXt(M, X_raw)
  expect_equal(result, matrix(0, L, n), tolerance = 1e-10)
})

test_that("compute_MXt is equivalent to row-wise compute_Xb", {
  set.seed(1616)
  n <- 40
  p <- 8
  L <- 4
  X_raw <- matrix(rnorm(n * p), n, p)
  M <- matrix(rnorm(L * p), L, p)
  cm <- colMeans(X_raw)
  csd <- apply(X_raw, 2, sd)
  attr(X_raw, "scaled:center") <- cm
  attr(X_raw, "scaled:scale") <- csd
  # Using compute_MXt
  result_MXt <- compute_MXt(M, X_raw)
  # Using row-wise compute_Xb
  result_Xb <- t(apply(M, 1, function(b) compute_Xb(X_raw, b)))
  expect_equal(result_MXt, result_Xb, tolerance = 1e-10)
})

# =============================================================================
# Edge Cases and Consistency
# =============================================================================
test_that("sparse multiplication functions preserve dimensions correctly", {
  set.seed(1717)
  n <- 25
  p <- 7
  L <- 3
  X_raw <- matrix(rnorm(n * p), n, p)
  b <- rnorm(p)
  y <- rnorm(n)
  M <- matrix(rnorm(L * p), L, p)
  attr(X_raw, "scaled:center") <- colMeans(X_raw)
  attr(X_raw, "scaled:scale") <- apply(X_raw, 2, sd)
  # Test dimensions
  expect_length(compute_Xb(X_raw, b), n)
  expect_length(compute_Xty(X_raw, y), p)
  expect_equal(dim(compute_XtX(X_raw)), c(p, p))
  expect_equal(dim(compute_MXt(M, X_raw)), c(L, n))
})

test_that("all sparse functions handle edge case with p=1", {
  set.seed(1818)
  n <- 50
  p <- 1
  X_raw <- matrix(rnorm(n * p), n, p)
  b <- rnorm(p)
  y <- rnorm(n)
  M <- matrix(rnorm(2 * p), 2, p)
  attr(X_raw, "scaled:center") <- colMeans(X_raw)
  attr(X_raw, "scaled:scale") <- apply(X_raw, 2, sd)
  # Should not error
  expect_length(compute_Xb(X_raw, b), n)
  expect_length(compute_Xty(X_raw, y), p)
  expect_equal(dim(compute_XtX(X_raw)), c(p, p))
  expect_equal(dim(compute_MXt(M, X_raw)), c(2, n))
})

test_that("consistency test: compute_Xty(X,y) should equal t(X) %*% y for standardized X", {
  set.seed(1919)
  n <- 45
  p <- 9
  X_raw <- matrix(rnorm(n * p), n, p)
  y <- rnorm(n)
  cm <- colMeans(X_raw)
  csd <- apply(X_raw, 2, sd)
  attr(X_raw, "scaled:center") <- cm
  attr(X_raw, "scaled:scale") <- csd
  # Using compute_Xty
  result1 <- compute_Xty(X_raw, y)
  # Manually standardize and compute
  X_std <- scale(X_raw, center = cm, scale = csd)
  result2 <- as.vector(t(X_std) %*% y)
  expect_equal(result1, result2, tolerance = 1e-10)
})

test_that("consistency test: compute_Xb and compute_XtX relationship", {
  set.seed(2020)
  n <- 50
  p <- 10
  X_raw <- matrix(rnorm(n * p), n, p)
  b1 <- rnorm(p)
  b2 <- rnorm(p)
  cm <- colMeans(X_raw)
  csd <- apply(X_raw, 2, sd)
  attr(X_raw, "scaled:center") <- cm
  attr(X_raw, "scaled:scale") <- csd
  # Compute Xb1 and Xb2
  Xb1 <- compute_Xb(X_raw, b1)
  Xb2 <- compute_Xb(X_raw, b2)
  # Inner product should equal b1' XtX b2
  XtX <- compute_XtX(X_raw)
  result1 <- sum(Xb1 * Xb2)
  result2 <- sum(b1 * (XtX %*% b2))
  expect_equal(result1, result2, tolerance = 1e-9)
})


================================================
FILE: tests/testthat/test_sufficient_stats_methods.R
================================================
context("S3 methods for sufficient statistics (ss) data class")

# =============================================================================
# DATA INITIALIZATION & CONFIGURATION
#
# =============================================================================
test_that("configure_data.ss returns data when unmappable_effects='none'", {
  setup <- setup_ss_data(unmappable_effects = "none")
  result <- configure_data.ss(setup$data, setup$params)
  expect_true("ss" %in% class(result))
  expect_false("eigen_values" %in% names(result))
})

test_that("configure_data.ss adds eigen decomposition for unmappable_effects='inf'", {
  setup <- setup_ss_data(unmappable_effects = "inf")
  # Remove eigen components to test they get added
  setup$data$eigen_values <- NULL
  setup$data$eigen_vectors <- NULL
  setup$data$VtXty <- NULL
  result <- configure_data.ss(setup$data, setup$params)
  expect_true("eigen_values" %in% names(result))
  expect_true("eigen_vectors" %in% names(result))
  expect_true("VtXty" %in% names(result))
})

test_that("sufficient_stats_constructor accepts unmappable_effects='ash'", {
  base_data <- generate_base_data(n = 100, p = 50, k = 0, seed = 1)
  XtX <- crossprod(base_data$X)
  Xty <- crossprod(base_data$X, base_data$y)
  yty <- sum(base_data$y^2)
  # ash is now supported for sufficient statistics via mr.ash.rss
  result <- sufficient_stats_constructor(Xty = Xty, yty = yty,
                                         n = base_data$n, XtX = XtX,
                                         unmappable_effects = "ash")
  expect_true(inherits(result$data, "ss"))
  expect_equal(result$params$unmappable_effects, "ash")
})

test_that("get_var_y.ss computes variance of y", {
  setup <- setup_ss_data()
  var_y <- get_var_y.ss(setup$data)
  expect_type(var_y, "double")
  expect_length(var_y, 1)
  expect_true(var_y > 0)
  expect_equal(var_y, setup$data$yty / (setup$data$n - 1))
})

# =============================================================================
# MODEL INITIALIZATION & SETUP
# =============================================================================
test_that("initialize_susie_model.ss creates model with predictor_weights (none)", {
  setup <- setup_ss_data(unmappable_effects = "none")
  # FIX: was var(setup$data$yty / setup$data$n). yty is a scalar (sum of
  # squares of centered y), so var() of it returns NA in R — the sample
  # variance of a length-1 vector is undefined. Use the same estimate
  # yty/(n-1) as every sibling test in this file (and as asserted for
  # get_var_y.ss above).
  var_y <- setup$data$yty / (setup$data$n - 1)
  model <- initialize_susie_model.ss(setup$data, setup$params, var_y)
  expect_true("predictor_weights" %in% names(model))
  expect_length(model$predictor_weights, setup$data$p)
  expect_equal(model$predictor_weights, attr(setup$data$XtX, "d"))
})

test_that("initialize_susie_model.ss initializes omega quantities for unmappable_effects='inf'", {
  setup <- setup_ss_data(unmappable_effects = "inf")
  var_y <- setup$data$yty / (setup$data$n - 1)
  model <- initialize_susie_model.ss(setup$data, setup$params, var_y)
  expect_true("omega_var" %in% names(model))
  expect_true("predictor_weights" %in% names(model))
  expect_true("XtOmegay" %in% names(model))
  expect_true("tau2" %in% names(model))
  expect_true("theta" %in% names(model))
  # tau2 and theta start at zero before any updates
  expect_equal(model$tau2, 0)
  expect_equal(model$theta, rep(0, setup$data$p))
})

test_that("initialize_fitted.ss creates XtXr", {
  setup <- setup_ss_data()
  mat_init <- list(
    alpha = setup$model$alpha,
    mu = setup$model$mu
  )
  fitted <- initialize_fitted.ss(setup$data, mat_init)
  expect_true("XtXr" %in% names(fitted))
  expect_length(fitted$XtXr, setup$data$p)
})

test_that("validate_prior.ss checks prior variance", {
  setup <- setup_ss_data()
  setup$params$check_prior <- TRUE
  # Should not error for reasonable prior variance
  expect_error(
    validate_prior.ss(setup$data, setup$params, setup$model),
    NA
  )
})

test_that("validate_prior.ss errors when prior variance is unreasonably large", {
  setup <- setup_ss_data()
  setup$params$check_prior <- TRUE
  # Initialize model properly to get predictor_weights
  var_y <- setup$data$yty / (setup$data$n - 1)
  setup$model <- initialize_susie_model.ss(setup$data, setup$params, var_y)
  # Compute zm (max z-score magnitude)
  bhat <- setup$data$Xty / setup$model$predictor_weights
  shat <- sqrt(setup$model$sigma2 / setup$model$predictor_weights)
  z <- bhat / shat
  zm <- max(abs(z[!is.nan(z)]))
  # Set V to be unreasonably large (more than 100 * zm^2)
  setup$model$V <- rep(150 * (zm^2), setup$params$L)
  expect_error(
    validate_prior.ss(setup$data, setup$params, setup$model),
    "Estimated prior variance is unreasonably large"
  )
})

test_that("track_ibss_fit.ss delegates to default when unmappable_effects='none'", {
  setup <- setup_ss_data(unmappable_effects = "none")
  tracking <- list()
  iter <- 1
  elbo <- -100
  result <- track_ibss_fit.ss(setup$data, setup$params, setup$model,
                              tracking, iter, elbo)
  expect_type(result, "list")
})

test_that("track_ibss_fit.ss tracks tau2 for unmappable_effects='inf'", {
  setup <- setup_ss_data(unmappable_effects = "inf")
  setup$params$track_fit <- TRUE
  tracking <- list()
  iter <- 1
  elbo <- -100
  result <- track_ibss_fit.ss(setup$data, setup$params, setup$model,
                              tracking, iter, elbo)
  expect_true("tau2" %in% names(result[[1]]))
  expect_equal(result[[1]]$tau2, setup$model$tau2)
})

# =============================================================================
# SINGLE EFFECT REGRESSION & ELBO
# =============================================================================
test_that("compute_residuals.ss computes residuals for unmappable_effects='none'", {
  setup <- setup_ss_data(unmappable_effects = "none")
  l <- 1
  model <- compute_residuals.ss(setup$data, setup$params, setup$model, l)
  expect_true("residuals" %in% names(model))
  expect_true("fitted_without_l" %in% names(model))
  expect_true("residual_variance" %in% names(model))
  expect_length(model$residuals, setup$data$p)
  expect_equal(model$residual_variance, setup$model$sigma2)
})

test_that("compute_residuals.ss computes omega-weighted residuals for unmappable_effects='inf'", {
  setup <- setup_ss_data(unmappable_effects = "inf")
  l <- 1
  # Initialize omega quantities first
  var_y <- setup$data$yty / (setup$data$n - 1)
  setup$model <- initialize_susie_model.ss(setup$data, setup$params, var_y)
  model <- compute_residuals.ss(setup$data, setup$params, setup$model, l)
  expect_true("residuals" %in% names(model))
  expect_true("predictor_weights" %in% names(model))
  expect_true("residual_variance" %in% names(model))
  expect_length(model$residuals, setup$data$p)
  # In the omega-weighted parameterization the residual variance is fixed at 1
  expect_equal(model$residual_variance, 1)
})

test_that("compute_ser_statistics.ss computes betahat and shat2 for unmappable_effects='none'", {
  setup <- setup_ss_data(unmappable_effects = "none")
  l <- 1
  model <- compute_residuals.ss(setup$data, setup$params, setup$model, l)
  ser_stats <- compute_ser_statistics.ss(setup$data, setup$params, model, l)
  expect_true("betahat" %in% names(ser_stats))
  expect_true("shat2" %in% names(ser_stats))
  expect_true("optim_init" %in% names(ser_stats))
  expect_true("optim_bounds" %in% names(ser_stats))
  expect_true("optim_scale" %in% names(ser_stats))
  expect_length(ser_stats$betahat, setup$data$p)
  expect_length(ser_stats$shat2, setup$data$p)
  expect_equal(ser_stats$optim_scale, "log")
  expect_equal(ser_stats$optim_bounds, c(-30, 15))
})

test_that("compute_ser_statistics.ss uses linear scale for unmappable_effects='inf'", {
  setup <- setup_ss_data(unmappable_effects = "inf")
  l <- 1
  var_y <- setup$data$yty / (setup$data$n - 1)
  setup$model <- initialize_susie_model.ss(setup$data, setup$params, var_y)
  model <- compute_residuals.ss(setup$data, setup$params, setup$model, l)
  ser_stats <- compute_ser_statistics.ss(setup$data, setup$params, model, l)
  expect_equal(ser_stats$optim_scale, "linear")
  expect_equal(ser_stats$optim_bounds, c(0, 1))
  expect_equal(ser_stats$optim_init, model$V[l])
})

test_that("SER_posterior_e_loglik.ss computes expected log-likelihood for unmappable_effects='none'", {
  setup <- setup_ss_data(unmappable_effects = "none")
  l <- 1
  setup$model$alpha[l, ] <- rep(1/setup$data$p, setup$data$p)
  setup$model$mu[l, ] <- rnorm(setup$data$p)
  setup$model$mu2[l, ] <- setup$model$mu[l, ]^2 + 0.1
  model <- compute_residuals.ss(setup$data, setup$params, setup$model, l)
  e_loglik <- SER_posterior_e_loglik.ss(setup$data, setup$params, model, l)
  expect_type(e_loglik, "double")
  expect_length(e_loglik, 1)
})

test_that("SER_posterior_e_loglik.ss uses omega-weighted likelihood for unmappable_effects='inf'", {
  setup <- setup_ss_data(unmappable_effects = "inf")
  l <- 1
  var_y <- setup$data$yty / (setup$data$n - 1)
  setup$model <- initialize_susie_model.ss(setup$data, setup$params, var_y)
  setup$model$alpha[l, ] <- rep(1/setup$data$p, setup$data$p)
  setup$model$mu[l, ] <- rnorm(setup$data$p, sd = 0.01)
  setup$model$mu2[l, ] <- setup$model$mu[l, ]^2 + 0.01
  model <- compute_residuals.ss(setup$data, setup$params, setup$model, l)
  e_loglik <- SER_posterior_e_loglik.ss(setup$data, setup$params, model, l)
  expect_type(e_loglik, "double")
  expect_length(e_loglik, 1)
})

test_that("calculate_posterior_moments.ss computes posterior correctly", {
  setup <- setup_ss_data()
  l <- 1
  V <- 1.0
  model <- compute_residuals.ss(setup$data, setup$params, setup$model, l)
  model <- calculate_posterior_moments.ss(setup$data, setup$params, model, V, l)
  expect_length(model$mu[l, ], setup$data$p)
  expect_length(model$mu2[l, ], setup$data$p)
  # Second moment must dominate squared first moment (variance >= 0)
  post_var <- model$mu2[l, ] - model$mu[l, ]^2
  expect_true(all(post_var >= -1e-10))
  expect_true(all(model$mu2[l, ] >= model$mu[l, ]^2 - 1e-10))
})

test_that("compute_kl.ss delegates to default method", {
  setup <- setup_ss_data()
  l <- 1
  setup$model$lbf <- rep(0, setup$params$L)
  setup$model$alpha[l, ] <- rep(1/setup$data$p, setup$data$p)
  setup$model$mu[l, ] <- rnorm(setup$data$p, sd = 0.1)
  setup$model$mu2[l, ] <- setup$model$mu[l, ]^2 + 0.1
  model <- compute_residuals.ss(setup$data, setup$params, setup$model, l)
  model <- compute_kl.ss(setup$data, setup$params, model, l)
  expect_type(model$KL[l], "double")
  expect_length(model$KL[l], 1)
})

test_that("get_ER2.ss computes expected squared residuals", {
  setup <- setup_ss_data()
  er2 <- get_ER2.ss(setup$data, setup$model)
  expect_type(er2, "double")
  expect_length(er2, 1)
  expect_true(er2 >= 0)
})

test_that("Eloglik.ss computes expected log-likelihood", {
  setup <- setup_ss_data()
  e_loglik <- Eloglik.ss(setup$data, setup$model)
  expect_type(e_loglik, "double")
  expect_length(e_loglik, 1)
})

test_that("loglik.ss computes log Bayes factors", {
  setup <- setup_ss_data()
  l <- 1
  V <- 1.0
  model <- compute_residuals.ss(setup$data, setup$params, setup$model, l)
  ser_stats <- compute_ser_statistics.ss(setup$data, setup$params, model, l)
  model <- loglik.ss(setup$data, setup$params, model, V, ser_stats, l)
  expect_length(model$lbf_variable[l, ], setup$data$p)
  expect_length(model$alpha[l, ], setup$data$p)
  # alpha is a posterior inclusion distribution: non-negative, sums to 1
  expect_true(all(model$alpha[l, ] >= 0))
  expect_true(abs(sum(model$alpha[l, ]) - 1) < 1e-10)
  expect_true(is.numeric(model$lbf[l]))
})

test_that("neg_loglik.ss returns negative log-likelihood for unmappable_effects='none'", {
  setup <- setup_ss_data(unmappable_effects = "none")
  l <- 1
  V_param <- log(1.0)
  model <- compute_residuals.ss(setup$data, setup$params, setup$model, l)
  ser_stats <- compute_ser_statistics.ss(setup$data, setup$params, model, l)
  neg_ll <- neg_loglik.ss(setup$data, setup$params, model, V_param, ser_stats)
  expect_type(neg_ll, "double")
  expect_length(neg_ll, 1)
})

test_that("neg_loglik.ss uses unmappable objective for unmappable_effects='inf'", {
  setup <- setup_ss_data(unmappable_effects = "inf")
  l <- 1
  V_param <- 0.5 # Linear scale
  var_y <- setup$data$yty / (setup$data$n - 1)
  setup$model <- initialize_susie_model.ss(setup$data, setup$params, var_y)
  model <- compute_residuals.ss(setup$data, setup$params, setup$model, l)
  ser_stats <- compute_ser_statistics.ss(setup$data, setup$params, model, l)
  neg_ll <- neg_loglik.ss(setup$data, setup$params, model, V_param, ser_stats)
  expect_type(neg_ll, "double")
  expect_length(neg_ll, 1)
})

# =============================================================================
# MODEL UPDATES & FITTING
# =============================================================================
test_that("update_fitted_values.ss updates XtXr for unmappable_effects='none'", {
  setup <- setup_ss_data(unmappable_effects = "none")
  l <- 1
  model <- compute_residuals.ss(setup$data, setup$params, setup$model, l)
  setup$model$fitted_without_l <- model$fitted_without_l
  updated_model <- update_fitted_values.ss(setup$data, setup$params,
                                           setup$model, l)
  expect_true("XtXr" %in% names(updated_model))
  expect_length(updated_model$XtXr, setup$data$p)
})

test_that("update_fitted_values.ss includes theta for unmappable_effects='inf'", {
  setup <- setup_ss_data(unmappable_effects = "inf")
  l <- 1
  var_y <- setup$data$yty / (setup$data$n - 1)
  setup$model <- initialize_susie_model.ss(setup$data, setup$params, var_y)
  updated_model <- update_fitted_values.ss(setup$data, setup$params,
                                           setup$model, l)
  expect_true("XtXr" %in% names(updated_model))
  expect_length(updated_model$XtXr, setup$data$p)
})

test_that("update_variance_components.ss delegates to default for unmappable_effects='none'", {
  setup <- setup_ss_data(unmappable_effects = "none")
  result <- update_variance_components.ss(setup$data, setup$params, setup$model)
  expect_type(result, "list")
  expect_true("sigma2" %in% names(result))
})

test_that("update_variance_components.ss uses MLE for unmappable_effects='inf' with estimate_residual_method='MLE'", {
  # Create setup with unmappable_effects='inf' but override to use MLE
  base_data <- generate_base_data(n = 100, p = 50, k = 0, seed = 42)
  X <- base_data$X
  y <- base_data$y
  # Center and scale
  X_colmeans <- colMeans(X)
  X <- sweep(X, 2, X_colmeans)
  y_mean <- mean(y)
  y <- y - y_mean
  # Compute sufficient statistics
  XtX <- crossprod(X)
  Xty <- as.vector(crossprod(X, y))
  yty <- sum(y^2)
  # Create constructor with MLE method (not the default MoM)
  susie_objects <- sufficient_stats_constructor(
    XtX = XtX,
    Xty = Xty,
    yty = yty,
    n = 100,
    L = 5,
    X_colmeans = X_colmeans,
    y_mean = y_mean,
    standardize = TRUE,
    unmappable_effects = "inf",
    estimate_residual_method = "MLE", # Force MLE instead of default MoM
    residual_variance = 1,
    convergence_method = "pip",
    coverage = 0.95,
    min_abs_corr = 0.5,
    n_purity = 100,
    check_prior = FALSE,
    track_fit = FALSE
  )
  data <- susie_objects$data
  params <- susie_objects$params
  # Initialize model properly
  var_y <- data$yty / (data$n - 1)
  model <- initialize_susie_model.ss(data, params, var_y)
  # Verify we're using MLE
  expect_equal(params$estimate_residual_method, "MLE")
  # Call update_variance_components which should use mle_unmappable
  result <- update_variance_components.ss(data, params, model)
  # Check that result has expected fields
  expect_type(result, "list")
  expect_true("sigma2" %in% names(result))
  expect_true("tau2" %in% names(result))
  expect_true("theta" %in% names(result))
  # Check values are reasonable
  expect_true(result$sigma2 > 0)
  expect_true(result$tau2 >= 0)
  expect_length(result$theta, data$p)
})

test_that("update_derived_quantities.ss delegates to default for unmappable_effects='none'", {
  setup <- setup_ss_data(unmappable_effects = "none")
  result <- update_derived_quantities.ss(setup$data, setup$params, setup$model)
  expect_type(result, "list")
})

test_that("update_derived_quantities.ss updates omega quantities for unmappable_effects='inf'", {
  setup <- setup_ss_data(unmappable_effects = "inf")
  var_y <- setup$data$yty / (setup$data$n - 1)
  setup$model <- initialize_susie_model.ss(setup$data, setup$params, var_y)
  result <- update_derived_quantities.ss(setup$data, setup$params, setup$model)
  expect_true("omega_var" %in% names(result))
  expect_true("predictor_weights" %in% names(result))
  expect_true("XtOmegay" %in% names(result))
  expect_true("XtXr" %in% names(result))
})

# =============================================================================
# OUTPUT GENERATION & POST-PROCESSING
# =============================================================================
test_that("get_scale_factors.ss returns column scale factors", {
  setup <- setup_ss_data()
  scales <- get_scale_factors.ss(setup$data, setup$params)
  expect_length(scales, setup$data$p)
  expect_true(all(scales > 0))
  expect_equal(scales, attr(setup$data$XtX, "scaled:scale"))
})

# NOTE: this test continues beyond the end of this chunk.
test_that("get_intercept.ss computes intercept", {
  setup <- setup_ss_data()
  setup$params$intercept <- TRUE
  intercept <- get_intercept.ss(setup$data, setup$params, setup$model)
  expect_type(intercept, "double")
  expect_length(intercept, 1)
}) test_that("get_fitted.ss delegates to default method", { setup <- setup_ss_data() fitted <- get_fitted.ss(setup$data, setup$params, setup$model) # Default method returns NULL for SS data expect_null(fitted) }) test_that("get_cs.ss returns NULL when coverage is NULL", { setup <- setup_ss_data() setup$params$coverage <- NULL cs <- get_cs.ss(setup$data, setup$params, setup$model) expect_null(cs) }) test_that("get_cs.ss returns NULL when min_abs_corr is NULL", { setup <- setup_ss_data() setup$params$min_abs_corr <- NULL cs <- get_cs.ss(setup$data, setup$params, setup$model) expect_null(cs) }) test_that("get_cs.ss computes correlation from XtX when diagonal not standardized", { setup <- setup_ss_data() # Make diagonal not 0 or 1 diag(setup$data$XtX) <- diag(setup$data$XtX) * 1.5 # Add strong signal to create credible set setup$model$alpha[1, 1] <- 0.95 setup$model$alpha[1, -1] <- 0.05 / (setup$data$p - 1) cs <- get_cs.ss(setup$data, setup$params, setup$model) # May or may not find CS, but should not error expect_true(is.null(cs) || is.list(cs)) }) test_that("get_cs.ss uses XtX directly when diagonal is standardized", { setup <- setup_ss_data() R <- cor(matrix(rnorm(100 * setup$data$p), 100, setup$data$p)) setup$data$XtX <- R # Verify diagonal is all 1s (correlation matrix) expect_true(all(diag(setup$data$XtX) %in% c(0, 1))) # Add strong signal to create credible set setup$model$alpha[1, 1] <- 0.95 setup$model$alpha[1, -1] <- 0.05 / (setup$data$p - 1) # Call get_cs.ss which should use the else branch (Xcorr <- data$XtX) cs <- get_cs.ss(setup$data, setup$params, setup$model) # May or may not find CS, but should not error expect_true(is.null(cs) || is.list(cs)) }) test_that("get_variable_names.ss assigns variable names to model", { setup <- setup_ss_data() colnames(setup$data$XtX) <- paste0("var", 1:setup$data$p) setup$model$pip <- rep(0.1, setup$data$p) setup$model$null_weight <- NULL setup$model$alpha <- matrix(0, 5, setup$data$p) setup$model$mu <- matrix(0, 5, 
setup$data$p) setup$model$mu2 <- matrix(0, 5, setup$data$p) setup$model$lbf_variable <- matrix(0, 5, setup$data$p) model_with_names <- get_variable_names.ss(setup$data, setup$model) expect_true(all(grepl("var", colnames(model_with_names$alpha)))) expect_true(all(grepl("var", colnames(model_with_names$mu)))) expect_true(all(grepl("var", colnames(model_with_names$mu2)))) expect_true(all(grepl("var", names(model_with_names$pip)))) }) test_that("get_zscore.ss delegates to default method", { setup <- setup_ss_data() setup$params$compute_univariate_zscore <- TRUE z <- get_zscore.ss(setup$data, setup$params, setup$model) expect_true(is.null(z) || is.numeric(z)) }) test_that("cleanup_model.ss removes temporary fields for unmappable_effects='none'", { setup <- setup_ss_data(unmappable_effects = "none") setup$model$residuals <- rnorm(setup$data$p) cleaned <- cleanup_model.ss(setup$data, setup$params, setup$model) expect_false("residuals" %in% names(cleaned)) }) test_that("cleanup_model.ss removes omega fields for unmappable_effects='inf'", { setup <- setup_ss_data(unmappable_effects = "inf") var_y <- setup$data$yty / (setup$data$n - 1) setup$model <- initialize_susie_model.ss(setup$data, setup$params, var_y) setup$model$residuals <- rnorm(setup$data$p) cleaned <- cleanup_model.ss(setup$data, setup$params, setup$model) expect_false("omega_var" %in% names(cleaned)) expect_false("XtOmegay" %in% names(cleaned)) expect_false("residuals" %in% names(cleaned)) }) context("susie() N>=2P hint and compute_suff_stat() workflow") # These tests cover the two changes added in # - R/susie.R (the N>=2P hint) # - vignettes/finemapping.Rmd (compute_suff_stat -> susie_ss) # They intentionally do NOT modify the existing # "susie_ss agrees with susie on same data" # test in test_susie.R; that test stays as-is and uses hand-rolled crossprod. # The tests below exercise the user-facing compute_suff_stat() composition # instead, which is the path the new vignette section recommends. 
# -----------------------------------------------------------------------------
# Hint behaviour
# -----------------------------------------------------------------------------

test_that("susie emits a hint pointing to compute_suff_stat() when nrow(X) >= 2 * ncol(X)", {
  set.seed(2026)
  n <- 200
  p <- 50 # n >= 2 * p, so the hint should fire
  X <- matrix(rnorm(n * p), n, p)
  y <- rnorm(n)
  # warning_message(..., style = "hint") goes through message(), and the
  # message body contains the literal "compute_suff_stat". expect_message
  # matches any of the emitted messages, so unrelated ones (e.g. the
  # non-convergence note triggered by max_iter = 2) do not break this test.
  expect_message(
    susie(X, y, L = 3, max_iter = 2, verbose = FALSE),
    "compute_suff_stat")
})

test_that("susie does not emit the compute_suff_stat hint when nrow(X) < 2 * ncol(X)", {
  set.seed(2027)
  n <- 60
  p <- 50 # n < 2 * p, so the hint must stay silent
  X <- matrix(rnorm(n * p), n, p)
  y <- rnorm(n)
  emitted <- suppressWarnings(capture_messages(
    susie(X, y, L = 3, max_iter = 2, verbose = FALSE)))
  expect_false(any(grepl("compute_suff_stat", emitted, fixed = TRUE)))
})

test_that("the hint does not interfere with susie's normal control flow", {
  # Regression check: the hint is purely advisory, so its presence must not
  # alter the fit relative to running with messages suppressed.
  set.seed(2028)
  n <- 200
  p <- 50
  X <- matrix(rnorm(n * p), n, p)
  beta <- rep(0, p)
  beta[c(5, 15, 25)] <- c(1, -1, 1.5)
  y <- as.vector(X %*% beta + rnorm(n, sd = 0.5))
  fit <- suppressMessages(
    susie(X, y, L = 5, max_iter = 100, verbose = FALSE))
  expect_s3_class(fit, "susie")
  expect_length(fit$pip, p)
  expect_equal(rowSums(fit$alpha), rep(1, 5), tolerance = 1e-10)
  expect_true(all(is.finite(fit$elbo)))
})

# -----------------------------------------------------------------------------
# Vignette workflow: compute_suff_stat() -> susie_ss()
# -----------------------------------------------------------------------------

test_that("compute_suff_stat() + susie_ss() agrees with susie() on the same data", {
  # Mirrors the new vignette section: pipe compute_suff_stat output straight
  # into susie_ss with matching standardize/intercept settings and recover
  # the susie() fit.
  set.seed(2029)
  n <- 100
  p <- 50 # same dimensions as the existing 1e-3 reference test
  X <- matrix(rnorm(n * p), n, p)
  beta <- rep(0, p)
  beta[c(5, 15, 25)] <- c(1, -1, 1.5)
  y <- as.vector(X %*% beta + rnorm(n, sd = 0.5))
  # With n = 2 * p the hint fires; keep the output clean by muffling it.
  fit_ind <- suppressMessages(susie(
    X, y, L = 5, standardize = TRUE, intercept = TRUE, verbose = FALSE))
  sstats <- compute_suff_stat(X, y, standardize = FALSE)
  fit_ss <- susie_ss(
    XtX = sstats$XtX, Xty = sstats$Xty, yty = sstats$yty, n = sstats$n,
    X_colmeans = sstats$X_colmeans, y_mean = sstats$y_mean,
    L = 5, standardize = TRUE, verbose = FALSE)
  # Tolerance matches the existing
  #   "susie_ss agrees with susie on same data" (test_susie.R, seed 33)
  # test, which runs the same configuration via hand-rolled crossprod.
  # compute_suff_stat() yields algebraically identical XtX/Xty/yty, so the
  # same bound applies here.
  expect_equal(fit_ind$pip, fit_ss$pip, tolerance = 1e-3)
  expect_equal(fit_ind$V, fit_ss$V, tolerance = 1e-3)
  expect_equal(fit_ind$sigma2, fit_ss$sigma2, tolerance = 1e-3)
})

test_that("compute_suff_stat: XtX can be reused across multiple y vectors", {
  # The vignette's workhorse pattern: compute the expensive XtX once, then
  # swap in new Xty/yty/y_mean for each response. Two invariants are pinned:
  #   (1) X-only quantities (XtX, X_colmeans, n) are byte-identical between
  #       a reused-stats object and a freshly recomputed one.
  #   (2) susie_ss gives the same fit from either object.
  # If either breaks, users iterating over many proteins on the same locus
  # get silently wrong answers.
  set.seed(2030)
  n <- 80
  p <- 30
  X <- matrix(rnorm(n * p), n, p)
  Y <- matrix(rnorm(n * 2), n, 2)
  stats_first <- compute_suff_stat(X, Y[, 1], standardize = FALSE)
  # Reuse path: keep XtX/X_colmeans, rebuild only the y-dependent slots.
  y2_mean <- mean(Y[, 2])
  y2c <- Y[, 2] - y2_mean
  stats_reused <- stats_first
  stats_reused$Xty <- drop(y2c %*% X)
  stats_reused$yty <- sum(y2c^2)
  stats_reused$y_mean <- y2_mean
  # Reference path: recompute everything from scratch on Y[, 2].
  stats_fresh <- compute_suff_stat(X, Y[, 2], standardize = FALSE)
  # X-only quantities must be byte-identical: same X, same code path.
  expect_identical(stats_reused$XtX, stats_fresh$XtX)
  expect_identical(stats_reused$X_colmeans, stats_fresh$X_colmeans)
  expect_identical(stats_reused$n, stats_fresh$n)
  # y-only quantities come from different computations; match numerically.
  expect_equal(stats_reused$Xty, stats_fresh$Xty, tolerance = 1e-12)
  expect_equal(stats_reused$yty, stats_fresh$yty, tolerance = 1e-12)
  expect_equal(stats_reused$y_mean, stats_fresh$y_mean, tolerance = 1e-12)
  # End-to-end: both stat sets must produce the same fit.
  fit_reused <- susie_ss(
    XtX = stats_reused$XtX, Xty = stats_reused$Xty, yty = stats_reused$yty,
    n = stats_reused$n, X_colmeans = stats_reused$X_colmeans,
    y_mean = stats_reused$y_mean, L = 5, verbose = FALSE)
  fit_fresh <- susie_ss(
    XtX = stats_fresh$XtX, Xty = stats_fresh$Xty, yty = stats_fresh$yty,
    n = stats_fresh$n, X_colmeans = stats_fresh$X_colmeans,
    y_mean = stats_fresh$y_mean, L = 5, verbose = FALSE)
  expect_equal(fit_reused$pip, fit_fresh$pip, tolerance = 1e-10)
  expect_equal(fit_reused$V, fit_fresh$V, tolerance = 1e-10)
})


================================================
FILE: tests/testthat/test_summary_print.R
================================================

context("summary and print S3 methods")

# =============================================================================
# summary.susie - Summary Statistics
# =============================================================================

test_that("summary.susie creates correct structure", {
  set.seed(1)
  sim <- simulate_regression(n = 200, p = 100, k = 3, signal_sd = 2)
  fit <- susie(sim$X, sim$y, L = 10, verbose = FALSE)
  fit$sets <- susie_get_cs(fit, X = sim$X, coverage = 0.95)
  summ <- summary(fit)
  expect_type(summ, "list")
  expect_s3_class(summ, "summary.susie")
  expect_named(summ, c("vars", "cs"))
})

test_that("summary.susie variables data frame has correct structure", {
  set.seed(2)
  sim <- simulate_regression(n = 200, p = 100, k = 3, signal_sd = 2)
  fit <- susie(sim$X, sim$y, L = 10, verbose = FALSE)
  fit$sets <- susie_get_cs(fit, X = sim$X, coverage = 0.95)
  summ <- summary(fit)
  expect_s3_class(summ$vars, "data.frame")
  expect_true(all(c("variable", "variable_prob", "cs") %in% colnames(summ$vars)))
  expect_equal(nrow(summ$vars), sim$p)
})

test_that("summary.susie CS data frame has correct structure when CS exist", {
  set.seed(3)
  sim <- simulate_regression(n = 200, p = 100, k = 3, signal_sd = 2)
  fit <- susie(sim$X, sim$y, L = 10, verbose = FALSE)
  fit$sets <- susie_get_cs(fit, X = sim$X, coverage = 0.95)
  summ <- summary(fit)
  if (!is.null(fit$sets$cs)) {
    expect_s3_class(summ$cs, "data.frame")
    expect_true(all(c("cs", "cs_log10bf", "cs_avg_r2", "cs_min_r2", "variable") %in%
                      colnames(summ$cs)))
    expect_equal(nrow(summ$cs), length(fit$sets$cs))
  }
})

test_that("summary.susie variables sorted by PIP descending", {
  set.seed(4)
  sim <- simulate_regression(n = 200, p = 100, k = 3, signal_sd = 2)
  fit <- susie(sim$X, sim$y, L = 10, verbose = FALSE)
  fit$sets <- susie_get_cs(fit, X = sim$X, coverage = 0.95)
  summ <- summary(fit)
  if (!is.null(fit$sets$cs)) {
    expect_true(all(diff(summ$vars$variable_prob) <= 0))
  }
})

test_that("summary.susie cs column maps variables to credible sets", {
  set.seed(5)
  sim <- simulate_regression(n = 200, p = 100, k = 3, signal_sd = 2)
  fit <- susie(sim$X, sim$y, L = 10, verbose = FALSE)
  fit$sets <- susie_get_cs(fit, X = sim$X, coverage = 0.95)
  summ <- summary(fit)
  if (!is.null(fit$sets$cs)) {
    for (i in 1:length(fit$sets$cs)) {
      cs_vars <- fit$sets$cs[[i]]
      cs_idx <- fit$sets$cs_index[i]
      # Every member of CS i must carry that CS's index in the vars table.
      expect_true(all(summ$vars$cs[summ$vars$variable %in% cs_vars] == cs_idx))
    }
  }
})

test_that("summary.susie handles null_index correctly", {
  set.seed(6)
  sim <- simulate_regression(n = 200, p = 100, k = 3, signal_sd = 2)
  fit <- susie(sim$X, sim$y, L = 10, null_weight = 0.1, verbose = FALSE)
  fit$sets <- susie_get_cs(fit, X = sim$X, coverage = 0.95)
  summ <- summary(fit)
  if (!is.null(fit$null_index) && fit$null_index > 0) {
    expect_equal(nrow(summ$vars), sim$p)
  } else {
    expect_equal(nrow(summ$vars), ncol(fit$alpha))
  }
})

test_that("summary.susie errors when sets is NULL", {
  set.seed(7)
  sim <- simulate_regression(n = 100, p = 50, k = 3)
  fit <- susie(sim$X, sim$y, L = 5, verbose = FALSE)
  fit$sets <- NULL
  expect_error(
    summary(fit),
    "credible set information")
})

test_that("summary.susie handles no credible sets", {
  set.seed(8)
  sim <- simulate_regression(n = 100, p = 50, k = 3, signal_sd = 0.1)
  fit <- susie(sim$X, sim$y, L = 5, verbose = FALSE)
  fit$sets <- susie_get_cs(fit, X = sim$X, coverage = 0.95,
                           min_abs_corr = 0.99)
  summ <- summary(fit)
  expect_null(summ$cs)
  expect_s3_class(summ$vars, "data.frame")
})

test_that("summary.susie log10BF calculation is correct", {
  set.seed(9)
  sim <- simulate_regression(n = 200, p = 100, k = 3, signal_sd = 2)
  fit <- susie(sim$X, sim$y, L = 10, verbose = FALSE)
  fit$sets <- susie_get_cs(fit, X = sim$X, coverage = 0.95)
  summ <- summary(fit)
  if (!is.null(summ$cs)) {
    for (i in 1:nrow(summ$cs)) {
      cs_idx <- summ$cs$cs[i]
      # log10(BF) is the natural-log Bayes factor divided by log(10).
      expected_log10bf <- fit$lbf[cs_idx] / log(10)
      expect_equal(summ$cs$cs_log10bf[i], expected_log10bf)
    }
  }
})

test_that("summary.susie r2 calculations are correct", {
  set.seed(10)
  sim <- simulate_regression(n = 200, p = 100, k = 3, signal_sd = 2)
  fit <- susie(sim$X, sim$y, L = 10, verbose = FALSE)
  fit$sets <- susie_get_cs(fit, X = sim$X, coverage = 0.95)
  summ <- summary(fit)
  if (!is.null(summ$cs) && !is.null(fit$sets$purity)) {
    for (i in 1:nrow(summ$cs)) {
      # r2 columns are the squared purity correlations.
      expect_equal(summ$cs$cs_avg_r2[i], fit$sets$purity$mean.abs.corr[i]^2)
      expect_equal(summ$cs$cs_min_r2[i], fit$sets$purity$min.abs.corr[i]^2)
    }
  }
})

# =============================================================================
# print.summary.susie - Console Output
# =============================================================================

test_that("print.summary.susie produces output", {
  set.seed(11)
  sim <- simulate_regression(n = 200, p = 100, k = 3, signal_sd = 2)
  fit <- susie(sim$X, sim$y, L = 10, verbose = FALSE)
  fit$sets <- susie_get_cs(fit, X = sim$X, coverage = 0.95)
  summ <- summary(fit)
  expect_message(capture.output(print(summ)), "Variables in credible sets")
  expect_message(capture.output(print(summ)), "Credible sets summary")
})

test_that("print.summary.susie handles no CS", {
  set.seed(12)
  sim <- simulate_regression(n = 100, p = 50, k = 3, signal_sd = 0.1)
  fit <- susie(sim$X, sim$y, L = 5, verbose = FALSE)
  fit$sets <- susie_get_cs(fit, X = sim$X, coverage = 0.95,
                           min_abs_corr = 0.99)
  summ <- summary(fit)
  expect_message(capture.output(print(summ)))
})
test_that("print.summary.susie shows variables in CS", {
  set.seed(13)
  sim <- simulate_regression(n = 200, p = 100, k = 3, signal_sd = 2)
  fit <- susie(sim$X, sim$y, L = 10, verbose = FALSE)
  fit$sets <- susie_get_cs(fit, X = sim$X, coverage = 0.95)
  summ <- summary(fit)
  printed <- capture.output(print(summ))
  printed_text <- paste(printed, collapse = "\n")
  if (!is.null(fit$sets$cs)) {
    cs_vars <- summ$vars[summ$vars$cs > 0, ]
    for (i in 1:nrow(cs_vars)) {
      # Each CS member's index must appear somewhere in the printed text.
      expect_true(grepl(as.character(cs_vars$variable[i]), printed_text))
    }
  }
})

test_that("summary and print work together", {
  set.seed(14)
  sim <- simulate_regression(n = 200, p = 100, k = 3, signal_sd = 2)
  fit <- susie(sim$X, sim$y, L = 10, verbose = FALSE)
  fit$sets <- susie_get_cs(fit, X = sim$X, coverage = 0.95)
  expect_message(capture.output({
    summ <- summary(fit)
    print(summ)
  }))
})

test_that("summary.susie variable column is sequential indices", {
  set.seed(15)
  sim <- simulate_regression(n = 100, p = 50, k = 3)
  fit <- susie(sim$X, sim$y, L = 5, verbose = FALSE)
  fit$sets <- susie_get_cs(fit, X = sim$X, coverage = 0.95)
  summ <- summary(fit)
  expect_equal(sort(unique(summ$vars$variable)), 1:sim$p)
})

test_that("summary.susie variable_prob matches PIP", {
  set.seed(16)
  sim <- simulate_regression(n = 100, p = 50, k = 3)
  fit <- susie(sim$X, sim$y, L = 5, verbose = FALSE)
  fit$sets <- susie_get_cs(fit, X = sim$X, coverage = 0.95)
  summ <- summary(fit)
  expect_equal(sort(summ$vars$variable_prob, decreasing = TRUE),
               sort(fit$pip, decreasing = TRUE))
})


================================================
FILE: tests/testthat/test_susie.R
================================================

context("Main susie interface functions")

# =============================================================================
# SUSIE() - BASIC FUNCTIONALITY
# =============================================================================

test_that("susie returns valid susie object", {
  set.seed(1)
  sim <- simulate_regression(n = 100, p = 50, k = 3)
  fit <- susie(sim$X, sim$y, L = 5, verbose = FALSE)
  expect_s3_class(fit, "susie")
  expect_true("alpha" %in% names(fit))
  expect_true("mu" %in% names(fit))
  expect_true("mu2" %in% names(fit))
  expect_true("V" %in% names(fit))
  expect_true("sigma2" %in% names(fit))
  expect_true("pip" %in% names(fit))
  expect_true("sets" %in% names(fit))
  expect_true("elbo" %in% names(fit))
})

test_that("susie has correct dimensions", {
  set.seed(2)
  sim <- simulate_regression(n = 100, p = 50, k = 3)
  fit <- susie(sim$X, sim$y, L = 5, verbose = FALSE)
  expect_equal(dim(fit$alpha), c(5, 50))
  expect_equal(dim(fit$mu), c(5, 50))
  expect_equal(dim(fit$mu2), c(5, 50))
  expect_length(fit$V, 5)
  expect_length(fit$pip, 50)
  expect_length(fit$fitted, 100)
})

test_that("susie maintains valid probability distributions", {
  set.seed(3)
  sim <- simulate_regression(n = 100, p = 50, k = 3)
  fit <- susie(sim$X, sim$y, L = 5, verbose = FALSE)
  # Each single-effect posterior (row of alpha) sums to one.
  expect_equal(rowSums(fit$alpha), rep(1, 5), tolerance = 1e-10)
  # All alpha entries are valid probabilities.
  expect_true(all(fit$alpha >= 0 & fit$alpha <= 1))
  # PIPs are valid probabilities too.
  expect_true(all(fit$pip >= 0 & fit$pip <= 1))
})

test_that("susie ELBO is monotonically increasing", {
  set.seed(4)
  sim <- simulate_regression(n = 100, p = 50, k = 3)
  fit <- susie(sim$X, sim$y, L = 5, verbose = FALSE)
  elbo_diff <- diff(fit$elbo)
  expect_true(all(elbo_diff > -1e-6))
})

test_that("susie converges within max_iter", {
  set.seed(5)
  sim <- simulate_regression(n = 100, p = 50, k = 3)
  fit <- susie(sim$X, sim$y, L = 5, max_iter = 100, verbose = FALSE)
  expect_true(fit$niter <= 100)
  expect_true("converged" %in% names(fit))
})

# =============================================================================
# SUSIE() - PARAMETER HANDLING
# =============================================================================

test_that("susie respects L parameter", {
  set.seed(6)
  sim <- simulate_regression(n = 100, p = 50, k = 3)
  fit_L3 <- susie(sim$X, sim$y, L = 3, verbose = FALSE)
  fit_L7 <- susie(sim$X, sim$y, L = 7, verbose = FALSE)
  expect_equal(nrow(fit_L3$alpha), 3)
  expect_equal(nrow(fit_L7$alpha), 7)
})

test_that("susie adjusts L when L > p", {
  set.seed(7)
  sim <- simulate_regression(n = 100, p = 20, k = 3)
  fit <- susie(sim$X, sim$y, L = 50, verbose = FALSE)
  expect_equal(nrow(fit$alpha), 20)
})

test_that("susie handles standardize parameter", {
  set.seed(8)
  sim <- simulate_regression(n = 100, p = 50, k = 3)
  fit_std <- susie(sim$X, sim$y, L = 5, standardize = TRUE, verbose = FALSE)
  fit_nostd <- susie(sim$X, sim$y, L = 5, standardize = FALSE, verbose = FALSE)
  expect_s3_class(fit_std, "susie")
  expect_s3_class(fit_nostd, "susie")
  expect_true(all(fit_std$X_column_scale_factors > 0))
})

test_that("susie handles intercept parameter", {
  set.seed(9)
  sim <- simulate_regression(n = 100, p = 50, k = 3)
  fit_int <- susie(sim$X, sim$y, L = 5, intercept = TRUE, verbose = FALSE)
  fit_noint <- susie(sim$X, sim$y, L = 5, intercept = FALSE, verbose = FALSE)
  expect_true(is.finite(fit_int$intercept))
  expect_equal(fit_noint$intercept, 0)
})

test_that("susie handles prior_weights parameter", {
  set.seed(10)
  sim <- simulate_regression(n = 100, p = 50, k = 3)
  # Uniform prior weights.
  fit_uniform <- susie(sim$X, sim$y, L = 5, verbose = FALSE)
  # Custom weights that favor the first 10 variables.
  custom_weights <- c(rep(10, 10), rep(1, 40))
  fit_custom <- susie(sim$X, sim$y, L = 5, prior_weights = custom_weights,
                      verbose = FALSE)
  expect_s3_class(fit_uniform, "susie")
  expect_s3_class(fit_custom, "susie")
})

test_that("susie handles null_weight parameter", {
  set.seed(11)
  sim <- simulate_regression(n = 100, p = 50, k = 3)
  fit_nonull <- susie(sim$X, sim$y, L = 5, null_weight = 0, verbose = FALSE)
  fit_null <- susie(sim$X, sim$y, L = 5, null_weight = 0.1, verbose = FALSE)
  expect_equal(ncol(fit_nonull$alpha), 50)
  # A nonzero null weight appends one extra (null) column.
  expect_equal(ncol(fit_null$alpha), 51)
})

test_that("susie handles estimate_residual_variance parameter", {
  set.seed(12)
  sim <- simulate_regression(n = 100, p = 50, k = 3)
  fixed_sigma2 <- 1.5
  fit_fixed <- susie(sim$X, sim$y, L = 5, estimate_residual_variance = FALSE,
                     residual_variance = fixed_sigma2, verbose = FALSE)
  fit_est <- susie(sim$X, sim$y, L = 5, estimate_residual_variance = TRUE,
                   verbose = FALSE)
  expect_equal(fit_fixed$sigma2, fixed_sigma2)
  expect_true(fit_est$sigma2 != var(sim$y))
})

test_that("susie handles estimate_prior_variance parameter", {
  set.seed(13)
  sim <- simulate_regression(n = 100, p = 50, k = 3)
  fit_fixed <- susie(sim$X, sim$y, L = 5, estimate_prior_variance = FALSE,
                     scaled_prior_variance = 0.5, verbose = FALSE)
  fit_est <- susie(sim$X, sim$y, L = 5, estimate_prior_variance = TRUE,
                   verbose = FALSE)
  expect_s3_class(fit_fixed, "susie")
  expect_s3_class(fit_est, "susie")
})

test_that("susie handles convergence_method parameter", {
  set.seed(14)
  sim <- simulate_regression(n = 100, p = 50, k = 3)
  fit_elbo <- susie(sim$X, sim$y, L = 5, convergence_method = "elbo",
                    verbose = FALSE)
  fit_pip <- susie(sim$X, sim$y, L = 5, convergence_method = "pip",
                   verbose = FALSE)
  expect_s3_class(fit_elbo, "susie")
  expect_s3_class(fit_pip, "susie")
})

test_that("susie handles compute_univariate_zscore parameter", {
  set.seed(15)
  sim <- simulate_regression(n = 100, p = 50, k = 3)
  fit_noz <- susie(sim$X, sim$y, L = 5, compute_univariate_zscore = FALSE,
                   verbose = FALSE)
  fit_z <- susie(sim$X, sim$y, L = 5, compute_univariate_zscore = TRUE,
                 verbose = FALSE)
  expect_null(fit_noz$z)
  expect_true(!is.null(fit_z$z))
  expect_length(fit_z$z, 50)
})

# =============================================================================
# SUSIE() - VARIANCE ESTIMATION METHODS
# =============================================================================

test_that("susie handles estimate_residual_method = MoM", {
  set.seed(16)
  sim <- simulate_regression(n = 100, p = 50, k = 3)
  fit <- susie(sim$X, sim$y, L = 5, estimate_residual_method = "MoM",
               verbose = FALSE)
  expect_s3_class(fit, "susie")
  expect_true(fit$sigma2 > 0)
})

test_that("susie handles estimate_residual_method = MLE", {
  set.seed(17)
  sim <- simulate_regression(n = 100, p = 50, k = 3)
  fit <- susie(sim$X, sim$y, L = 5, estimate_residual_method = "MLE",
               verbose = FALSE)
  expect_s3_class(fit, "susie")
  expect_true(fit$sigma2 > 0)
})

test_that("susie handles estimate_residual_method = NIG", {
  set.seed(18)
  sim <- simulate_regression(n = 100, p = 50, k = 3)
  fit <- susie(sim$X, sim$y, L = 1, estimate_residual_method = "NIG",
               verbose = FALSE)
  expect_s3_class(fit, "susie")
  expect_true(fit$sigma2 > 0)
})

test_that("susie errors clearly for invalid NIG alpha0/beta0", {
  # Regression test for GitHub issue: NIG SER with alpha0 = 0 and beta0 > 0
  # using L = 1 previously produced an infinite ELBO crash. The fix rejects
  # improper Inverse-Gamma priors during parameter validation, before any
  # ELBO computation happens.
  set.seed(18)
  sim <- simulate_regression(n = 100, p = 50, k = 3)
  # The original failing configuration (L = 1, alpha0 = 0, beta0 > 0).
  expect_error(
    susie(sim$X, sim$y, L = 1, min_abs_corr = 0, check_null_threshold = -1000,
          estimate_residual_method = "NIG", alpha0 = 0, beta0 = 0.5,
          verbose = FALSE),
    "alpha0 > 0 and beta0 > 0")
  # Both hyperparameters zero -- previously a silent NaN; must error now.
  expect_error(
    susie(sim$X, sim$y, L = 1, min_abs_corr = 0, check_null_threshold = -1000,
          estimate_residual_method = "NIG", alpha0 = 0, beta0 = 0,
          verbose = FALSE),
    "alpha0 > 0 and beta0 > 0")
  # The same guard fires for L > 1 (the L=2 path no longer silently succeeds
  # with improper priors).
  expect_error(
    susie(sim$X, sim$y, L = 2, min_abs_corr = 0, check_null_threshold = -1000,
          estimate_residual_method = "NIG", alpha0 = 0, beta0 = 0.5,
          verbose = FALSE),
    "alpha0 > 0 and beta0 > 0")
  # Sanity check: proper alpha0/beta0 still fit for both L = 1 and L = 2.
  fit_l1 <- susie(sim$X, sim$y, L = 1, min_abs_corr = 0,
                  check_null_threshold = -1000,
                  estimate_residual_method = "NIG", alpha0 = 0.1, beta0 = 0.1,
                  verbose = FALSE)
  expect_s3_class(fit_l1, "susie")
  fit_l2 <- susie(sim$X, sim$y, L = 2, min_abs_corr = 0,
                  check_null_threshold = -1000,
                  estimate_residual_method = "NIG", alpha0 = 0.1, beta0 = 0.1,
                  verbose = FALSE)
  expect_s3_class(fit_l2, "susie")
})

test_that("susie handles estimate_prior_method options", {
  set.seed(19)
  sim <- simulate_regression(n = 100, p = 50, k = 3)
  fit_optim <- susie(sim$X, sim$y, L = 5, estimate_prior_method = "optim",
                     verbose = FALSE)
  fit_em <- susie(sim$X, sim$y, L = 5, estimate_prior_method = "EM",
                  verbose = FALSE)
  fit_simple <- susie(sim$X, sim$y, L = 5, estimate_prior_method = "simple",
                      verbose = FALSE)
  expect_s3_class(fit_optim, "susie")
  expect_s3_class(fit_em, "susie")
  expect_s3_class(fit_simple, "susie")
})

# =============================================================================
# SUSIE() - UNMAPPABLE EFFECTS
# =============================================================================

test_that("susie handles unmappable_effects = none", {
  set.seed(20)
  sim <- simulate_regression(n = 100, p = 50, k = 3)
  fit <- susie(sim$X, sim$y, L = 5, unmappable_effects = "none",
               verbose = FALSE)
  expect_s3_class(fit, "susie")
  expect_false("theta" %in% names(fit))
  expect_false("tau2" %in% names(fit))
})

test_that("susie handles unmappable_effects = inf", {
  set.seed(21)
  sim <- simulate_regression(n = 100, p = 50, k = 3)
  fit <- susie(sim$X, sim$y, L = 5, unmappable_effects = "inf",
               verbose = FALSE)
  expect_s3_class(fit, "susie")
  expect_true("theta" %in% names(fit))
  expect_true("tau2" %in% names(fit))
  expect_length(fit$theta, 50)
})

test_that("susie handles unmappable_effects = ash", {
  set.seed(22)
  sim <- simulate_regression(n = 100, p = 50, k = 3)
  fit <- susie(sim$X, sim$y, L = 5, unmappable_effects = "ash",
               verbose = FALSE)
  expect_s3_class(fit, "susie")
  expect_true("theta" %in% names(fit))
  expect_true("tau2" %in% names(fit))
})

# =============================================================================
# SUSIE() - SIGNAL RECOVERY
# =============================================================================

test_that("susie identifies true causal variables", {
  set.seed(23)
  sim <- simulate_regression(n = 200, p = 100, k = 3, signal_sd = 2)
  fit <- susie(sim$X, sim$y, L = 10, verbose = FALSE)
  # The top-ranked PIPs should contain at least one true causal variable.
  top_vars <- order(fit$pip, decreasing = TRUE)[1:10]
  overlap <- length(intersect(top_vars, sim$causal_idx))
  expect_true(overlap >= 1)
})

test_that("susie maintains low PIPs for null variables", {
  set.seed(24)
  sim <- simulate_regression(n = 200, p = 100, k = 3, signal_sd = 2)
  fit <- susie(sim$X, sim$y, L = 10, verbose = FALSE)
  null_vars <- setdiff(1:sim$p, sim$causal_idx)
  null_pips <- fit$pip[null_vars]
  expect_true(median(null_pips) < 0.3)
})

# =============================================================================
# SUSIE() - EDGE CASES
# =============================================================================

test_that("susie handles L = 1", {
  set.seed(25)
  sim <- simulate_regression(n = 100, p = 50, k = 1)
  fit <- susie(sim$X, sim$y, L = 1, verbose = FALSE)
  expect_equal(nrow(fit$alpha), 1)
  expect_equal(sum(fit$alpha), 1, tolerance = 1e-10)
})

test_that("susie handles small p", {
  set.seed(26)
  sim <- simulate_regression(n = 100, p = 5, k = 2)
  fit <- susie(sim$X, sim$y, L = 3, verbose = FALSE)
  expect_equal(ncol(fit$alpha), 5)
})

test_that("susie errors on NA values when na.rm = FALSE", {
  set.seed(28)
  sim <- simulate_regression(n = 100, p = 50, k = 3)
  sim$y[5] <- NA
  expect_error(
    susie(sim$X, sim$y, L = 5, na.rm = FALSE, verbose = FALSE),
    "must not contain missing values")
})

# =============================================================================
# SUSIE_SS() - BASIC FUNCTIONALITY
# =============================================================================

test_that("susie_ss returns valid susie object", {
  set.seed(29)
  sim <- simulate_regression(n = 100, p = 50, k = 3)
  # Hand-rolled sufficient statistics from the centered data.
  Xc <- scale(sim$X, center = TRUE, scale = FALSE)
  yc <- sim$y - mean(sim$y)
  XtX <- crossprod(Xc)
  Xty <- as.vector(crossprod(Xc, yc))
  yty <- sum(yc^2)
  fit <- susie_ss(XtX, Xty, yty, n = 100, L = 5, verbose = FALSE)
  expect_s3_class(fit, "susie")
  expect_true("alpha" %in% names(fit))
  expect_true("mu" %in% names(fit))
  expect_true("V" %in% names(fit))
  expect_true("sigma2" %in% names(fit))
  expect_true("pip" %in% names(fit))
})

test_that("susie_ss has correct dimensions", {
  set.seed(30)
  sim <- simulate_regression(n = 100, p = 50, k = 3)
  ss <- compute_summary_stats(sim$X, sim$y)
  fit <- susie_ss(ss$XtX, ss$Xty, ss$yty, n = ss$n, L = 5, verbose = FALSE)
  expect_equal(dim(fit$alpha), c(5, 50))
  expect_equal(dim(fit$mu), c(5, 50))
  expect_length(fit$V, 5)
  expect_length(fit$pip, 50)
})

test_that("susie_ss maintains valid probability distributions", {
  set.seed(31)
  sim <- simulate_regression(n = 100, p = 50, k = 3)
  ss <- compute_summary_stats(sim$X, sim$y)
  fit <- susie_ss(ss$XtX, ss$Xty, ss$yty, n = ss$n, L = 5, verbose = FALSE)
  expect_equal(rowSums(fit$alpha), rep(1, 5), tolerance = 1e-10)
  expect_true(all(fit$alpha >= 0 & fit$alpha <= 1))
  expect_true(all(fit$pip >= 0 & fit$pip <= 1))
})

test_that("susie_ss ELBO is monotonically increasing", {
  set.seed(32)
  sim <- simulate_regression(n = 100, p = 50, k = 3)
  ss <- compute_summary_stats(sim$X, sim$y)
  fit <- susie_ss(ss$XtX, ss$Xty, ss$yty, n = ss$n, L = 5, verbose = FALSE)
  elbo_diff <- diff(fit$elbo)
  expect_true(all(elbo_diff > -1e-6))
})

# =============================================================================
# SUSIE_SS() - CONSISTENCY WITH SUSIE()
# =============================================================================

test_that("susie_ss agrees with susie on same data", {
  set.seed(33)
  sim <- simulate_regression(n = 100, p = 50, k = 3)
  # Individual-level fit.
  fit_ind <- susie(sim$X, sim$y, L = 5, standardize = TRUE, verbose = FALSE)
  # Hand-rolled sufficient statistics from the centered data.
  Xc <- scale(sim$X, center = TRUE, scale = FALSE)
  yc <- sim$y - mean(sim$y)
  XtX <- crossprod(Xc)
  Xty <- as.vector(crossprod(Xc, yc))
  yty <- sum(yc^2)
  # Sufficient-statistic fit.
  fit_ss <- susie_ss(XtX, Xty, yty, n = 100, L = 5,
                     X_colmeans = colMeans(sim$X), y_mean = mean(sim$y),
                     standardize = TRUE, verbose = FALSE)
  # The two fits should agree closely.
  expect_equal(fit_ind$pip, fit_ss$pip, tolerance = 1e-3)
  expect_equal(fit_ind$V, fit_ss$V, tolerance = 1e-3)
  expect_equal(fit_ind$sigma2, fit_ss$sigma2, tolerance = 1e-3)
})

# =============================================================================
# SUSIE_SS() - PARAMETER HANDLING
# =============================================================================

test_that("susie_ss handles X_colmeans and y_mean for intercept", {
  set.seed(34)
  sim <- simulate_regression(n = 100, p = 50, k = 3)
  ss <- compute_summary_stats(sim$X, sim$y)
  fit_noint <- susie_ss(ss$XtX, ss$Xty, ss$yty, n = ss$n, L = 5,
                        verbose = FALSE)
  fit_int <- susie_ss(ss$XtX, ss$Xty, ss$yty, n = ss$n, L = 5,
                      X_colmeans = colMeans(sim$X), y_mean = mean(sim$y),
                      verbose = FALSE)
  # Without the means the intercept cannot be recovered.
  expect_true(is.na(fit_noint$intercept))
  expect_true(is.finite(fit_int$intercept))
})

test_that("susie_ss handles maf filtering", {
  set.seed(35)
  sim <- simulate_regression(n = 100, p = 50, k = 3)
  ss <- compute_summary_stats(sim$X, sim$y)
  maf <- runif(50, 0, 0.5)
  fit <- susie_ss(ss$XtX, ss$Xty, ss$yty, n = ss$n, L = 5, maf = maf,
                  maf_thresh = 0.1, verbose = FALSE)
  # Only variables above the MAF threshold should remain in the fit.
  n_filtered <- sum(maf > 0.1)
  expect_equal(ncol(fit$alpha), n_filtered)
})

test_that("susie_ss handles check_input parameter", {
  set.seed(36)
  sim <- simulate_regression(n = 100, p = 50, k = 3)
  ss <- compute_summary_stats(sim$X, sim$y)
  fit <- susie_ss(ss$XtX, ss$Xty, ss$yty, n = ss$n, L = 5, check_input = TRUE,
                  verbose = FALSE)
  expect_s3_class(fit, "susie")
})

test_that("susie_ss handles unmappable_effects = inf", {
  set.seed(37)
  sim <- simulate_regression(n = 100, p = 50, k = 3)
  ss <- compute_summary_stats(sim$X, sim$y)
  fit <- susie_ss(ss$XtX, ss$Xty, ss$yty, n = ss$n, L = 5,
                  unmappable_effects = "inf", verbose = FALSE)
  expect_s3_class(fit, "susie")
  expect_true("theta" %in% names(fit))
  expect_true("tau2" %in% names(fit))
})

# =============================================================================
# SUSIE_RSS() - BASIC FUNCTIONALITY (lambda = 0)
# =============================================================================

test_that("susie_rss with lambda = 0 returns valid susie object", {
  set.seed(39)
  sim <- simulate_regression(n = 100, p = 50, k = 3)
  ss <- compute_suff_stat(sim$X, sim$y, standardize = TRUE)
  z_scores <- with(univariate_regression(sim$X, sim$y), betahat / sebetahat)
  R <- with(ss, cov2cor(XtX))
  fit <- susie_rss(z = z_scores, R = R, n = 100, L = 5, verbose = FALSE)
  expect_s3_class(fit, "susie")
  expect_true("alpha" %in% names(fit))
  expect_true("mu" %in% names(fit))
  expect_true("V" %in% names(fit))
  expect_true("pip" %in% names(fit))
})

test_that("susie_rss with lambda = 0 has correct dimensions", {
  set.seed(40)
  sim <- simulate_regression(n = 100, p = 50, k = 3)
  ss <- compute_suff_stat(sim$X, sim$y, standardize = TRUE)
  z_scores <- with(univariate_regression(sim$X, sim$y), betahat / sebetahat)
  R <- with(ss, cov2cor(XtX))
  fit <- susie_rss(z = z_scores, R = R, n = 100, L = 5, verbose = FALSE)
  expect_equal(dim(fit$alpha), c(5, 50))
  expect_equal(dim(fit$mu), c(5, 50))
  expect_length(fit$V, 5)
  expect_length(fit$pip, 50)
})

test_that("susie_rss with lambda = 0 maintains valid probability distributions", {
  set.seed(41)
  sim <- simulate_regression(n = 100, p = 50, k = 3)
  ss <- compute_suff_stat(sim$X, sim$y, standardize = TRUE)
  z_scores <- with(univariate_regression(sim$X, sim$y), betahat / sebetahat)
  R <- with(ss, cov2cor(XtX))
  fit <- susie_rss(z = z_scores, R = R, n = 100, L = 5, verbose = FALSE)
  expect_equal(rowSums(fit$alpha), rep(1, 5), tolerance = 1e-10)
  expect_true(all(fit$alpha >= 0 & fit$alpha <= 1))
  expect_true(all(fit$pip >= 0 & fit$pip <= 1))
})

test_that("susie_rss with lambda = 0 accepts bhat and shat instead of z", {
  set.seed(42)
  dat <- simulate_regression(n = 100, p = 50, k = 3)
  ss <- compute_suff_stat(dat$X, dat$y,
standardize = TRUE) univar <- univariate_regression(dat$X, dat$y) R <- with(ss, cov2cor(XtX)) fit <- susie_rss(bhat = univar$betahat, shat = univar$sebetahat, R = R, n = 100, L = 5 , verbose = FALSE) expect_s3_class(fit, "susie") expect_equal(dim(fit$alpha), c(5, 50)) }) test_that("susie_rss with lambda = 0 handles maf filtering", { set.seed(43) dat <- simulate_regression(n = 100, p = 50, k = 3) ss <- compute_suff_stat(dat$X, dat$y, standardize = TRUE) z_scores <- with(univariate_regression(dat$X, dat$y), betahat / sebetahat) R <- with(ss, cov2cor(XtX)) maf <- runif(50, 0, 0.5) fit <- susie_rss(z = z_scores, R = R, n = 100, L = 5 , maf = maf, maf_thresh = 0.1, verbose = FALSE) n_filtered <- sum(maf > 0.1) expect_equal(ncol(fit$alpha), n_filtered) }) # ============================================================================= # SUSIE_RSS() - BASIC FUNCTIONALITY (lambda > 0) # ============================================================================= test_that("susie_rss_lambda with lambda > 0 returns valid susie object", { set.seed(44) setup <- setup_rss_lambda_data(n = 500, p = 50, k = 3, lambda = 1e-5, seed = NULL) fit <- susie_rss_lambda(z = setup$z, R = setup$R, L = 5, lambda = 1e-5, verbose = FALSE) expect_s3_class(fit, "susie") expect_true("alpha" %in% names(fit)) expect_true("mu" %in% names(fit)) expect_true("V" %in% names(fit)) expect_true("pip" %in% names(fit)) }) test_that("susie_rss_lambda with lambda > 0 has correct dimensions", { set.seed(45) setup <- setup_rss_lambda_data(n = 500, p = 50, k = 3, lambda = 1e-5, seed = NULL) fit <- susie_rss_lambda(z = setup$z, R = setup$R, L = 5, lambda = 1e-5, verbose = FALSE) expect_equal(dim(fit$alpha), c(5, 50)) expect_equal(dim(fit$mu), c(5, 50)) expect_length(fit$V, 5) expect_length(fit$pip, 50) }) test_that("susie_rss_lambda with lambda > 0 maintains valid probability distributions", { set.seed(46) setup <- setup_rss_lambda_data(n = 500, p = 50, k = 3, lambda = 1e-5, seed = NULL) fit <- susie_rss_lambda(z = 
setup$z, R = setup$R, L = 5, lambda = 1e-5, verbose = FALSE) expect_equal(rowSums(fit$alpha), rep(1, 5), tolerance = 1e-10) expect_true(all(fit$alpha >= 0 & fit$alpha <= 1)) expect_true(all(fit$pip >= 0 & fit$pip <= 1)) }) test_that("susie_rss_lambda with lambda > 0 handles maf filtering", { set.seed(47) setup <- setup_rss_lambda_data(n = 500, p = 50, k = 3, lambda = 1e-5, seed = NULL) maf <- runif(50, 0, 0.5) fit <- susie_rss_lambda(z = setup$z, R = setup$R, L = 5, lambda = 1e-5, maf = maf, maf_thresh = 0.1, verbose = FALSE) n_filtered <- sum(maf > 0.1) expect_equal(ncol(fit$alpha), n_filtered) }) test_that("susie_rss_lambda with lambda > 0 ELBO is monotonically increasing", { set.seed(48) setup <- setup_rss_lambda_data(n = 500, p = 50, k = 3, lambda = 1e-5, seed = NULL) fit <- susie_rss_lambda(z = setup$z, R = setup$R, L = 5, lambda = 1e-5, verbose = FALSE) elbo_diff <- diff(fit$elbo) expect_true(all(elbo_diff > -1e-6)) }) test_that("susie_rss_lambda with lambda > 0 identifies causal variables", { set.seed(49) setup <- setup_rss_lambda_data(n = 500, p = 50, k = 3, lambda = 1e-5, signal_sd = 1, seed = NULL) fit <- susie_rss_lambda(z = setup$z, R = setup$R, L = 10, lambda = 1e-5, verbose = FALSE) # Top PIPs should include at least one true causal variable top_vars <- order(fit$pip, decreasing = TRUE)[1:10] overlap <- length(intersect(top_vars, setup$causal_idx)) expect_true(overlap >= 1) }) # ============================================================================= # SUSIE_RSS() - LAMBDA PARAMETER HANDLING # ============================================================================= test_that("susie_rss switches data type based on lambda", { set.seed(50) dat <- simulate_regression(n = 100, p = 50, k = 3) ss <- compute_suff_stat(dat$X, dat$y, standardize = TRUE) z_scores <- with(univariate_regression(dat$X, dat$y), betahat / sebetahat) R <- with(ss, cov2cor(XtX)) # lambda = 0 should use sufficient statistics fit_lambda0 <- susie_rss(z = z_scores, R = R, n = 
100, L = 5 , verbose = FALSE) # lambda > 0 should use rss_lambda class fit_lambda_pos <- susie_rss_lambda(z = z_scores, R = R, L = 5, lambda = 1e-5, verbose = FALSE) expect_s3_class(fit_lambda0, "susie") expect_s3_class(fit_lambda_pos, "susie") }) test_that("susie_rss_lambda with lambda > 0 accepts n parameter for PVE adjustment", { set.seed(51) setup <- setup_rss_lambda_data(n = 500, p = 50, k = 3, lambda = 1e-5, seed = NULL) # n is now used for PVE adjustment in all paths; no "n is not used" warning fit <- susie_rss_lambda(z = setup$z, R = setup$R, n = 100, L = 5, lambda = 1e-5, verbose = FALSE) expect_s3_class(fit, "susie") }) test_that("susie_rss_lambda does not expose bhat/shat", { set.seed(52) setup <- setup_rss_lambda_data(n = 500, p = 50, k = 3, lambda = 1e-5, seed = NULL) expect_error( susie_rss_lambda(z = setup$z, R = setup$R, L = 5, bhat = rnorm(50), shat = runif(50, 0.5, 1), lambda = 1e-5, verbose = FALSE), "unused argument" ) }) test_that("susie_rss_lambda does not expose var_y", { set.seed(53) setup <- setup_rss_lambda_data(n = 500, p = 50, k = 3, lambda = 1e-5, seed = NULL) expect_error( susie_rss_lambda(z = setup$z, R = setup$R, L = 5, var_y = 1.5, lambda = 1e-5, verbose = FALSE), "unused argument" ) }) test_that("susie_rss does not expose intercept_value", { set.seed(54) dat <- simulate_regression(n = 100, p = 50, k = 3) ss <- compute_suff_stat(dat$X, dat$y, standardize = TRUE) z_scores <- with(univariate_regression(dat$X, dat$y), betahat / sebetahat) R <- with(ss, cov2cor(XtX)) expect_error( susie_rss(z = z_scores, R = R, n = 100, L = 5 , intercept_value = 0.5, verbose = FALSE), "unused argument" ) }) # ============================================================================= # SUSIE_RSS() - INPUT VALIDATION # ============================================================================= test_that("susie_rss requires either z or bhat/shat", { R <- diag(50) expect_error( susie_rss(R = R, n = 100, L = 5 , verbose = FALSE), "Please provide either 
z or \\(bhat, shat\\)" ) }) test_that("susie_rss rejects both z and bhat/shat", { z <- rnorm(50) bhat <- rnorm(50) shat <- runif(50, 0.5, 1) R <- diag(50) expect_error( susie_rss(z = z, bhat = bhat, shat = shat, R = R, n = 100, L = 5 , verbose = FALSE), "Please provide either z or \\(bhat, shat\\), but not both" ) }) test_that("susie_rss does not expose check_R", { set.seed(55) dat <- simulate_regression(n = 100, p = 50, k = 3) ss <- compute_suff_stat(dat$X, dat$y, standardize = TRUE) z_scores <- with(univariate_regression(dat$X, dat$y), betahat / sebetahat) R <- with(ss, cov2cor(XtX)) expect_error( susie_rss(z = z_scores, R = R, n = 100, L = 5, check_R = TRUE, verbose = FALSE), "unused argument" ) }) # ============================================================================= # INTEGRATION TESTS - CROSS-METHOD COMPARISONS # ============================================================================= test_that("susie, susie_ss, and susie_rss give similar PIPs", { set.seed(56) dat <- simulate_regression(n = 100, p = 50, k = 3, signal_sd = 2) # Fit with individual data fit_ind <- susie(dat$X, dat$y, L = 5, standardize = TRUE, intercept = TRUE, verbose = FALSE) # Fit with sufficient statistics X_centered <- scale(dat$X, center = TRUE, scale = FALSE) y_centered <- dat$y - mean(dat$y) XtX <- crossprod(X_centered) Xty <- as.vector(crossprod(X_centered, y_centered)) yty <- sum(y_centered^2) fit_ss <- susie_ss(XtX, Xty, yty, n = 100, L = 5, X_colmeans = colMeans(dat$X), y_mean = mean(dat$y), standardize = TRUE, verbose = FALSE) # Fit with RSS (lambda = 0) ss <- compute_suff_stat(dat$X, dat$y, standardize = TRUE) z_scores <- with(univariate_regression(dat$X, dat$y), betahat / sebetahat) R <- with(ss, cov2cor(XtX)) fit_rss <- susie_rss(z = z_scores, R = R, n = 100, L = 5 , verbose = FALSE, estimate_residual_variance = TRUE) # PIPs should be very similar expect_equal(fit_ind$pip, fit_ss$pip, tolerance = 1e-3) expect_equal(fit_ind$pip, fit_rss$pip, tolerance = 1e-2) }) 
test_that("All three interfaces find credible sets", {
  set.seed(57)
  dat <- simulate_regression(n = 200, p = 100, k = 3, signal_sd = 2)
  fit_ind <- susie(dat$X, dat$y, L = 10, verbose = FALSE)
  ss <- compute_summary_stats(dat$X, dat$y)
  fit_ss <- susie_ss(ss$XtX, ss$Xty, ss$yty, n = ss$n, L = 10, verbose = FALSE)
  ss_full <- compute_suff_stat(dat$X, dat$y, standardize = TRUE)
  z_scores <- with(univariate_regression(dat$X, dat$y), betahat / sebetahat)
  R <- with(ss_full, cov2cor(XtX))
  fit_rss <- susie_rss(z = z_scores, R = R, n = 200, L = 10, verbose = FALSE)
  # At least one method should find credible sets
  has_cs <- (!is.null(fit_ind$sets$cs) && length(fit_ind$sets$cs) > 0) ||
    (!is.null(fit_ss$sets$cs) && length(fit_ss$sets$cs) > 0) ||
    (!is.null(fit_rss$sets$cs) && length(fit_rss$sets$cs) > 0)
  expect_true(has_cs)
})

# =============================================================================
# REFINE PARAMETER
# =============================================================================

test_that("susie handles refine = TRUE", {
  set.seed(58)
  dat <- simulate_regression(n = 200, p = 100, k = 3, signal_sd = 2)
  fit_norefine <- susie(dat$X, dat$y, L = 10, refine = FALSE, verbose = FALSE)
  fit_refine <- susie(dat$X, dat$y, L = 10, refine = TRUE, verbose = FALSE)
  expect_s3_class(fit_norefine, "susie")
  expect_s3_class(fit_refine, "susie")
  # Refined model should have equal or better ELBO
  elbo_norefine <- susie_get_objective(fit_norefine, last_only = TRUE)
  elbo_refine <- susie_get_objective(fit_refine, last_only = TRUE)
  expect_true(elbo_refine >= elbo_norefine - 1e-6)
})

test_that("susie_ss handles refine = TRUE", {
  set.seed(59)
  dat <- simulate_regression(n = 200, p = 100, k = 3, signal_sd = 2)
  ss <- compute_summary_stats(dat$X, dat$y)
  fit <- susie_ss(ss$XtX, ss$Xty, ss$yty, n = ss$n, L = 10,
                  refine = TRUE, verbose = FALSE)
  expect_s3_class(fit, "susie")
})

test_that("susie_rss handles refine = TRUE", {
  set.seed(60)
  dat <- simulate_regression(n = 200, p = 100, k = 3, signal_sd = 2)
  ss <- compute_suff_stat(dat$X, dat$y, standardize = TRUE)
  z_scores <- with(univariate_regression(dat$X, dat$y), betahat / sebetahat)
  R <- with(ss, cov2cor(XtX))
  fit <- susie_rss(z = z_scores, R = R, n = 200, L = 10, refine = TRUE, verbose = FALSE)
  expect_s3_class(fit, "susie")
})

# =============================================================================
# TRACK_FIT PARAMETER
# =============================================================================

test_that("susie handles track_fit = TRUE", {
  set.seed(61)
  dat <- simulate_regression(n = 100, p = 50, k = 3)
  fit <- susie(dat$X, dat$y, L = 5, track_fit = TRUE, verbose = FALSE)
  expect_true("trace" %in% names(fit))
  expect_type(fit$trace, "list")
})

test_that("susie_ss handles track_fit = TRUE", {
  set.seed(62)
  dat <- simulate_regression(n = 100, p = 50, k = 3)
  ss <- compute_summary_stats(dat$X, dat$y)
  fit <- susie_ss(ss$XtX, ss$Xty, ss$yty, n = ss$n, L = 5,
                  track_fit = TRUE, verbose = FALSE)
  expect_true("trace" %in% names(fit))
  expect_type(fit$trace, "list")
})

test_that("susie_rss handles track_fit = TRUE", {
  set.seed(63)
  dat <- simulate_regression(n = 100, p = 50, k = 3)
  ss <- compute_suff_stat(dat$X, dat$y, standardize = TRUE)
  z_scores <- with(univariate_regression(dat$X, dat$y), betahat / sebetahat)
  R <- with(ss, cov2cor(XtX))
  fit <- susie_rss(z = z_scores, R = R, n = 100, L = 5,
                   track_fit = TRUE, verbose = FALSE)
  expect_true("trace" %in% names(fit))
  expect_type(fit$trace, "list")
})

# =============================================================================
# VERBOSE PARAMETER
# =============================================================================

test_that("susie verbose output works", {
  set.seed(64)
  dat <- simulate_regression(n = 100, p = 50, k = 3)
  expect_message(
    susie(dat$X, dat$y, L = 5, verbose = TRUE),
    "ELBO"
  )
})

test_that("susie_ss verbose output works", {
  set.seed(65)
  dat <- simulate_regression(n = 100, p = 50, k = 3)
  ss <- compute_summary_stats(dat$X, dat$y)
  expect_message(
    susie_ss(ss$XtX, ss$Xty, ss$yty, n = ss$n, L = 5, verbose = TRUE),
    "ELBO"
  )
})

test_that("susie_rss verbose output works", {
  set.seed(66)
  dat <- simulate_regression(n = 100, p = 50, k = 3)
  ss <- compute_suff_stat(dat$X, dat$y, standardize = TRUE)
  z_scores <- with(univariate_regression(dat$X, dat$y), betahat / sebetahat)
  R <- with(ss, cov2cor(XtX))
  expect_message(
    susie_rss(z = z_scores, R = R, n = 100, L = 5, verbose = TRUE),
    "ELBO"
  )
})

# =============================================================================
# MATHEMATICAL PROPERTIES - ALL INTERFACES
# =============================================================================

test_that("All interfaces maintain non-negative prior variances", {
  set.seed(67)
  dat <- simulate_regression(n = 100, p = 50, k = 3)
  fit_ind <- susie(dat$X, dat$y, L = 5, verbose = FALSE)
  expect_true(all(fit_ind$V >= 0))
  ss <- compute_summary_stats(dat$X, dat$y)
  fit_ss <- susie_ss(ss$XtX, ss$Xty, ss$yty, n = ss$n, L = 5, verbose = FALSE)
  expect_true(all(fit_ss$V >= 0))
  ss_full <- compute_suff_stat(dat$X, dat$y, standardize = TRUE)
  z_scores <- with(univariate_regression(dat$X, dat$y), betahat / sebetahat)
  R <- with(ss_full, cov2cor(XtX))
  fit_rss <- susie_rss(z = z_scores, R = R, n = 100, L = 5, verbose = FALSE)
  expect_true(all(fit_rss$V >= 0))
})

test_that("All interfaces maintain positive residual variance", {
  set.seed(68)
  dat <- simulate_regression(n = 100, p = 50, k = 3)
  fit_ind <- susie(dat$X, dat$y, L = 5, verbose = FALSE)
  expect_true(fit_ind$sigma2 > 0)
  ss <- compute_summary_stats(dat$X, dat$y)
  fit_ss <- susie_ss(ss$XtX, ss$Xty, ss$yty, n = ss$n, L = 5, verbose = FALSE)
  expect_true(fit_ss$sigma2 > 0)
  ss_full <- compute_suff_stat(dat$X, dat$y, standardize = TRUE)
  z_scores <- with(univariate_regression(dat$X, dat$y), betahat / sebetahat)
  R <- with(ss_full, cov2cor(XtX))
  fit_rss <- susie_rss(z = z_scores, R = R, n = 100, L = 5, verbose = FALSE)
  expect_true(fit_rss$sigma2 > 0)
})

# =============================================================================
# OUTPUT COMPATIBILITY
# =============================================================================

test_that("All interfaces produce output compatible with susie_get functions", {
  set.seed(69)
  dat <- simulate_regression(n = 100, p = 50, k = 3)
  # Test susie
  fit_ind <- susie(dat$X, dat$y, L = 5, verbose = FALSE)
  expect_length(susie_get_pip(fit_ind), 50)
  expect_equal(susie_get_objective(fit_ind, last_only = TRUE),
               fit_ind$elbo[length(fit_ind$elbo)])
  # Test susie_ss
  ss <- compute_summary_stats(dat$X, dat$y)
  fit_ss <- susie_ss(ss$XtX, ss$Xty, ss$yty, n = ss$n, L = 5, verbose = FALSE)
  expect_length(susie_get_pip(fit_ss), 50)
  expect_equal(susie_get_objective(fit_ss, last_only = TRUE),
               fit_ss$elbo[length(fit_ss$elbo)])
  # Test susie_rss
  ss_full <- compute_suff_stat(dat$X, dat$y, standardize = TRUE)
  z_scores <- with(univariate_regression(dat$X, dat$y), betahat / sebetahat)
  R <- with(ss_full, cov2cor(XtX))
  fit_rss <- susie_rss(z = z_scores, R = R, n = 100, L = 5, verbose = FALSE)
  expect_length(susie_get_pip(fit_rss), 50)
  expect_equal(susie_get_objective(fit_rss, last_only = TRUE),
               fit_rss$elbo[length(fit_rss$elbo)])
})


================================================
FILE: tests/testthat/test_susie_ash_ss_equivalence.R
================================================
# =============================================================================
# Test: SuSiE-ash (filter-archived) Individual vs Summary Statistics Equivalence
# =============================================================================
#
# Verifies that the archived filter-based masking path
# (unmappable_effects="ash_filter_archived") produces equivalent results
# between individual-level (mr.ash) and summary stats (mr.ash.rss) paths.
# Both share the masking logic via compute_ash_masking().
# =============================================================================

# Helper: prepare individual and SS data from a common dataset
setup_susie_ash_test <- function(n = 200, p = 50, k = 5, seed = 42) {
  set.seed(seed)
  X <- matrix(rnorm(n * p), n, p)
  X <- scale(X, center = TRUE, scale = TRUE)
  beta_true <- rep(0, p)
  causal <- sample(1:p, k)
  beta_true[causal] <- rnorm(k, sd = 2)
  y <- c(X %*% beta_true + rnorm(n))
  y <- y - mean(y)
  # Sufficient stats
  XtX <- crossprod(X)
  Xty <- crossprod(X, y)
  yty <- sum(y^2)
  # RSS inputs
  # Per-variable simple-regression coefficient and its standard error.
  bhat <- sapply(1:p, function(j) sum(X[, j] * y) / sum(X[, j]^2))
  shat <- sapply(1:p, function(j) {
    resid <- y - X[, j] * bhat[j]
    sqrt(sum(resid^2) / ((n - 2) * sum(X[, j]^2)))
  })
  R_mat <- susieR:::safe_cor(X)
  list(X = X, y = y, n = n, p = p,
       XtX = XtX, Xty = Xty, yty = yty,
       bhat = bhat, shat = shat, R_mat = R_mat,
       beta_true = beta_true, causal = causal)
}

test_that("susie_ss ash agrees with susie individual-level ash", {
  d <- setup_susie_ash_test(n = 200, p = 50, k = 5, seed = 42)
  # Individual-level: uses mr.ash directly
  fit_ind <- susie(d$X, d$y, L = 5,
    unmappable_effects = "ash_filter_archived",
    estimate_residual_variance = TRUE,
    estimate_prior_method = "optim",
    intercept = FALSE, standardize = FALSE,
    max_iter = 20, verbose = FALSE
  )
  # SS path: uses mr.ash.rss
  fit_ss <- susie_ss(
    XtX = d$XtX, Xty = d$Xty, yty = d$yty, n = d$n, L = 5,
    unmappable_effects = "ash_filter_archived",
    estimate_residual_variance = TRUE,
    estimate_prior_method = "optim",
    max_iter = 20, verbose = FALSE
  )
  # mr.ash and mr.ash.rss agree to ~1e-5 tolerance
  expect_equal(fit_ss$theta, fit_ind$theta, tolerance = 1e-4,
               label = "theta (mr.ash coefficients)")
  expect_equal(fit_ss$sigma2, fit_ind$sigma2, tolerance = 1e-4,
               label = "sigma2 (residual variance)")
  # PIPs should be highly correlated
  pip_cor <- cor(susie_get_pip(fit_ss), susie_get_pip(fit_ind))
  expect_true(pip_cor > 0.999, label = "PIP correlation > 0.999")
})

test_that("susie_ss ash works with different data sizes", {
  for (params in list(
    list(n = 100, p = 30, k = 3, seed = 100),
    list(n = 300, p = 80, k = 8, seed = 200)
  )) {
    d <- setup_susie_ash_test(
      n = params$n, p = params$p, k = params$k, seed = params$seed
    )
    fit_ind <- susie(d$X, d$y, L = 5,
      unmappable_effects = "ash_filter_archived",
      estimate_residual_variance = TRUE,
      estimate_prior_method = "optim",
      intercept = FALSE, standardize = FALSE,
      max_iter = 15, verbose = FALSE
    )
    fit_ss <- susie_ss(
      XtX = d$XtX, Xty = d$Xty, yty = d$yty, n = d$n, L = 5,
      unmappable_effects = "ash_filter_archived",
      estimate_residual_variance = TRUE,
      estimate_prior_method = "optim",
      max_iter = 15, verbose = FALSE
    )
    expect_equal(fit_ss$theta, fit_ind$theta, tolerance = 1e-4,
                 label = sprintf("theta (n=%d, p=%d)", params$n, params$p))
    expect_equal(fit_ss$sigma2, fit_ind$sigma2, tolerance = 1e-4,
                 label = sprintf("sigma2 (n=%d, p=%d)", params$n, params$p))
    pip_cor <- cor(susie_get_pip(fit_ss), susie_get_pip(fit_ind))
    expect_true(pip_cor > 0.999,
                label = sprintf("PIP cor > 0.999 (n=%d, p=%d)", params$n, params$p))
  }
})

test_that("susie individual-level ash output has expected fields", {
  d <- setup_susie_ash_test(n = 100, p = 30, k = 3, seed = 123)
  fit_ind <- susie(d$X, d$y, L = 5,
    unmappable_effects = "ash_filter_archived",
    estimate_residual_variance = TRUE,
    estimate_prior_method = "optim",
    intercept = FALSE, standardize = FALSE,
    max_iter = 10, verbose = FALSE
  )
  # Check key fields exist
  expect_true(is.numeric(fit_ind$theta))
  expect_true(is.numeric(fit_ind$sigma2))
  expect_true(is.numeric(fit_ind$tau2))
  expect_true(is.matrix(fit_ind$alpha))
  # Check dimensions
  expect_length(fit_ind$theta, d$p)
  expect_length(fit_ind$sigma2, 1)
  expect_equal(ncol(fit_ind$alpha), d$p)
  # X_theta should be cleaned up
  expect_null(fit_ind$X_theta)
})

test_that("susie_ss ash output has expected fields", {
  d <- setup_susie_ash_test(n = 100, p = 30, k = 3, seed = 123)
  fit_ss <- susie_ss(
    XtX = d$XtX, Xty = d$Xty, yty = d$yty, n = d$n, L = 5,
    unmappable_effects = "ash_filter_archived",
    estimate_residual_variance = TRUE,
    estimate_prior_method = "optim",
    max_iter = 10, verbose = FALSE
  )
  # Check key fields exist
  expect_true(is.numeric(fit_ss$theta))
  expect_true(is.numeric(fit_ss$sigma2))
  expect_true(is.numeric(fit_ss$tau2))
  expect_true(is.matrix(fit_ss$alpha))
  # Check dimensions
  expect_length(fit_ss$theta, d$p)
  expect_length(fit_ss$sigma2, 1)
  expect_equal(ncol(fit_ss$alpha), d$p)
})

test_that("susie_rss ash works with correlation matrix input", {
  d <- setup_susie_ash_test(n = 200, p = 50, k = 5, seed = 42)
  fit_rss <- susie_rss(
    bhat = d$bhat, shat = d$shat, R = d$R_mat, n = d$n, L = 5,
    unmappable_effects = "ash_filter_archived",
    estimate_residual_variance = TRUE,
    estimate_prior_method = "optim",
    max_iter = 20, verbose = FALSE
  )
  # Basic sanity checks
  expect_true(is.numeric(fit_rss$theta))
  expect_length(fit_rss$theta, d$p)
  expect_true(is.numeric(fit_rss$sigma2))
  expect_true(length(fit_rss$sets$cs) >= 0)
})


================================================
FILE: tests/testthat/test_susie_auto.R
================================================
context("susie_auto unit tests")

# =============================================================================
# ALGORITHM PROGRESSION
# =============================================================================

test_that("susie_auto starts with L_init and doubles correctly", {
  base_data <- generate_base_data(n = 100, p = 50, k = 3, signal_sd = 1, seed = 123)
  # Manually set specific beta values for this test
  base_data$beta[base_data$causal_idx] <- c(2, -1.5, 1)
  base_data$y <- as.vector(base_data$X %*% base_data$beta + rnorm(base_data$n))
  result <- susie_auto(base_data$X, base_data$y, L_init = 1, L_max = 4, verbose = FALSE)
  L_final <- nrow(result$alpha)
  expect_true(L_final >= 1)
  expect_true(L_final %in% c(1, 2, 4, 8))
})

test_that("susie_auto respects L_max limit", {
  base_data <- generate_base_data(n = 100, p = 50, k = 0, seed = 124)
  result <- susie_auto(base_data$X, base_data$y, L_init = 1, L_max = 8, verbose = FALSE)
  L_final <- nrow(result$alpha)
  expect_true(L_final %in% c(1, 2, 4, 8, 16))
})

test_that("susie_auto converges when prior variances hit zero", {
  base_data <- generate_base_data(n = 100, p = 50, k = 1, signal_sd = 3, seed = 125)
  # With single effect, should converge quickly (some V should be 0)
  result <- susie_auto(base_data$X, base_data$y, L_init = 2, L_max = 16, verbose = FALSE)
  # At least one prior variance should be zero (or very small)
  expect_true(any(result$V < 1e-3))
})

test_that("susie_auto handles L_init = L_max (no doubling)", {
  base_data <- generate_base_data(n = 100, p = 50, k = 2, signal_sd = 1.75, seed = 126)
  # No doubling should occur
  result <- susie_auto(base_data$X, base_data$y, L_init = 5, L_max = 5, verbose = FALSE)
  # Should complete successfully with L = 5
  expect_equal(nrow(result$alpha), 5)
  expect_true(is.finite(result$elbo[length(result$elbo)]))
})

# =============================================================================
# CONVERGENCE BEHAVIOR
# =============================================================================

test_that("susie_auto convergence logic: stops when any V = 0", {
  set.seed(127)
  base_data <- generate_base_data(n = 100, p = 50, k = 1, signal_sd = 5, seed = NULL)
  # Add lower noise
  base_data$y <- base_data$X %*% base_data$beta + rnorm(base_data$n, sd = 0.5)
  # Should converge with strong single effect
  result <- susie_auto(base_data$X, base_data$y, L_init = 1, L_max = 32, verbose = FALSE)
  # At least one V should be effectively zero (converged)
  expect_true(any(result$V < 1e-6))
  # Result should complete successfully
  expect_true(is.finite(result$elbo[length(result$elbo)]))
})

test_that("susie_auto continues until L_max when all V > 0", {
  set.seed(128)
  base_data <- generate_base_data(n = 100, p = 50, k = 10, signal_sd = 0.5, seed = NULL)
  result <- susie_auto(base_data$X, base_data$y, L_init = 1, L_max = 4, verbose = FALSE)
  L_final <- nrow(result$alpha)
  expect_true(L_final %in% c(1, 2, 4, 8))
})

# =============================================================================
# PARAMETER PROPAGATION
# =============================================================================

test_that("susie_auto propagates standardize parameter correctly", {
  base_data <- generate_base_data(n = 100, p = 50, k = 2, signal_sd = 1.75, seed = 129)
  # Create X with different scales
  base_data$X <- sweep(base_data$X, 2, seq(0.1, 5, length.out = base_data$p), "*")
  base_data$y <- as.vector(base_data$X %*% base_data$beta + rnorm(base_data$n))
  result_std <- susie_auto(base_data$X, base_data$y, L_init = 2, L_max = 4,
                           standardize = TRUE, verbose = FALSE)
  result_nostd <- susie_auto(base_data$X, base_data$y, L_init = 2, L_max = 4,
                             standardize = FALSE, verbose = FALSE)
  expect_true(all(result_std$alpha >= 0 & result_std$alpha <= 1))
  expect_true(all(result_nostd$alpha >= 0 & result_nostd$alpha <= 1))
})

test_that("susie_auto propagates intercept parameter correctly", {
  base_data <- generate_base_data(n = 100, p = 50, k = 2, signal_sd = 1.75, seed = 130)
  base_data$y <- as.vector(base_data$X %*% base_data$beta + 3 + rnorm(base_data$n)) # Add intercept
  result_int <- susie_auto(base_data$X, base_data$y, L_init = 2, L_max = 4,
                           intercept = TRUE, verbose = FALSE)
  result_noint <- susie_auto(base_data$X, base_data$y, L_init = 2, L_max = 4,
                             intercept = FALSE, verbose = FALSE)
  # Intercept estimates should differ
  expect_false(isTRUE(all.equal(result_int$intercept, result_noint$intercept,
                                tolerance = 1e-3)))
})

test_that("susie_auto propagates max_iter parameter correctly", {
  base_data <- generate_base_data(n = 100, p = 50, k = 2, signal_sd = 1.75, seed = 131)
  # Use very small max_iter to test propagation
  result <- susie_auto(base_data$X, base_data$y, L_init = 2, L_max = 2,
                       max_iter = 3, verbose = FALSE)
  # Should complete (may not converge, but should respect max_iter)
  expect_true(result$niter <= 3)
})

test_that("susie_auto uses init_tol for early runs and tol for final run", {
  base_data <- generate_base_data(n = 100, p = 50, k = 2, signal_sd = 1.75, seed = 132)
  # Large init_tol should make early runs converge faster
  result_large_init <- susie_auto(base_data$X, base_data$y, L_init = 2, L_max = 2,
                                  init_tol = 10, tol = 1e-3, verbose = FALSE)
  result_small_init <- susie_auto(base_data$X, base_data$y, L_init = 2, L_max = 2,
                                  init_tol = 1e-5, tol = 1e-3, verbose = FALSE)
  # Both should complete successfully
  expect_true(is.finite(result_large_init$elbo[length(result_large_init$elbo)]))
  expect_true(is.finite(result_small_init$elbo[length(result_small_init$elbo)]))
})

test_that("susie_auto passes additional arguments via ...", {
  base_data <- generate_base_data(n = 100, p = 50, k = 2, signal_sd = 1.75, seed = 133)
  # Pass coverage argument
  result <- susie_auto(base_data$X, base_data$y, L_init = 2, L_max = 2,
                       coverage = 0.9, verbose = FALSE)
  # Should complete successfully
  expect_true(is.finite(result$elbo[length(result$elbo)]))
  # Check that sets are computed (if any exist)
  if (!is.null(result$sets)) {
    expect_true(is.list(result$sets))
  }
})

# =============================================================================
# MODEL INITIALIZATION & EXPANSION
# =============================================================================

test_that("susie_auto correctly expands L via add_null_effect", {
  base_data <- generate_base_data(n = 100, p = 50, k = 5, signal_sd = 1, seed = 134)
  # Start small and let it expand
  result <- susie_auto(base_data$X, base_data$y, L_init = 1, L_max = 8, verbose = FALSE)
  L_final <- nrow(result$alpha)
  # Dimensions should be consistent
  expect_equal(nrow(result$alpha), L_final)
  expect_equal(nrow(result$mu), L_final)
  expect_equal(nrow(result$mu2), L_final)
  expect_equal(length(result$V), L_final)
  expect_equal(length(result$KL), L_final)
})

test_that("susie_auto maintains valid model structure throughout", {
  base_data <- generate_base_data(n = 100, p = 50, k = 2, signal_sd = 1.75, seed = 135)
  result <- susie_auto(base_data$X, base_data$y, L_init = 2, L_max = 4, verbose = FALSE)
  # Check model structure
  L <- nrow(result$alpha)
  expect_equal(dim(result$alpha), c(L, base_data$p))
  expect_equal(dim(result$mu), c(L, base_data$p))
  expect_equal(dim(result$mu2), c(L, base_data$p))
  expect_equal(length(result$V), L)
  expect_equal(length(result$KL), L)
  # Alpha rows should sum to 1
  expect_true(all(abs(rowSums(result$alpha) - 1) < 1e-10))
})

# =============================================================================
# VARIANCE ESTIMATION
# =============================================================================

test_that("susie_auto estimates variances in correct stages", {
  base_data <- generate_base_data(n = 100, p = 50, k = 2, signal_sd = 1.75, seed = 136)
  result <- susie_auto(base_data$X, base_data$y, L_init = 2, L_max = 2, verbose = FALSE)
  # Final result should have estimated variances
  expect_true(result$sigma2 > 0)
  expect_true(all(result$V >= 0))
})

test_that("susie_auto residual variance is positive", {
  base_data <- generate_base_data(n = 100, p = 50, k = 2, signal_sd = 1.75, seed = 137)
  result <- susie_auto(base_data$X, base_data$y, L_init = 2, L_max = 4, verbose = FALSE)
  expect_true(result$sigma2 > 0)
  expect_true(is.finite(result$sigma2))
})

test_that("susie_auto prior variances are non-negative", {
  base_data <- generate_base_data(n = 100, p = 50, k = 2, signal_sd = 1.75, seed = 138)
  result <- susie_auto(base_data$X, base_data$y, L_init = 2, L_max = 4, verbose = FALSE)
  expect_true(all(result$V >= 0))
  expect_true(all(is.finite(result$V)))
})

# =============================================================================
# EDGE CASES & ROBUSTNESS
# =============================================================================

test_that("susie_auto handles sparse signal (single effect)", {
  base_data <- generate_base_data(n = 100, p = 50, k = 1, signal_sd = 3, seed = 139)
  result <- susie_auto(base_data$X, base_data$y, L_init = 1, L_max = 8, verbose = FALSE)
  # Should identify the effect
  # NOTE(review): colSums(alpha * mu) is the posterior mean effect size, not a
  # PIP — presumably susie_get_pip() was intended; verify before relying on the
  # "high PIP" reading of the assertion below.
  pips <- colSums(result$alpha * result$mu)
  expect_true(max(pips) > 0.5) # At least one variable should have high PIP
  # Most V should be zero or very small
  expect_true(sum(result$V < 1e-3) >= length(result$V) - 2)
})

test_that("susie_auto handles dense signal (many effects)", {
  base_data <- generate_base_data(n = 100, p = 50, k = 8, signal_sd = 0.5, seed = 140)
  # May need multiple doublings
  result <- susie_auto(base_data$X, base_data$y, L_init = 2, L_max = 16, verbose = FALSE)
  # Should complete successfully
  expect_true(is.finite(result$elbo[length(result$elbo)]))
  expect_true(nrow(result$alpha) >= 2)
})

test_that("susie_auto handles high noise scenario", {
  set.seed(141)
  base_data <- generate_base_data(n = 100, p = 50, k = 2, signal_sd = 1.75, seed = NULL)
  # Add high noise
  base_data$y <- as.vector(base_data$X %*% base_data$beta + rnorm(base_data$n, sd = 5))
  result <- susie_auto(base_data$X, base_data$y, L_init = 2, L_max = 4, verbose = FALSE)
  # Should complete successfully
  expect_true(is.finite(result$elbo[length(result$elbo)]))
  expect_true(result$sigma2 > 0)
})

test_that("susie_auto handles no signal (pure noise)", {
  base_data <- generate_base_data(n = 100, p = 50, k = 0, seed = 142)
  result <- susie_auto(base_data$X, base_data$y, L_init = 1, L_max = 4, verbose = FALSE)
  # Should complete successfully
  expect_true(is.finite(result$elbo[length(result$elbo)]))
  # All effects should have small prior variance
  expect_true(all(result$V < 0.5))
  # No credible sets should be found
  expect_true(is.null(result$sets) || length(result$sets$cs) == 0)
})

test_that("susie_auto handles L_init = 1 (minimum)", {
  base_data <- generate_base_data(n = 100, p = 50, k = 2, signal_sd = 1.75, seed = 143)
  result <- susie_auto(base_data$X, base_data$y, L_init = 1, L_max = 8, verbose = FALSE)
  # Should complete successfully
  expect_true(is.finite(result$elbo[length(result$elbo)]))
  expect_true(nrow(result$alpha) >= 1)
})

test_that("susie_auto handles large L_init", {
  base_data <- generate_base_data(n = 100, p = 50, k = 2, signal_sd = 1.75, seed = 144)
  # Start with large L
  result <- susie_auto(base_data$X, base_data$y, L_init = 10, L_max = 10, verbose = FALSE)
  # Should complete successfully with L = 10
  expect_equal(nrow(result$alpha), 10)
  expect_true(is.finite(result$elbo[length(result$elbo)]))
})

# =============================================================================
# OUTPUT VALIDATION
# =============================================================================

test_that("susie_auto returns valid susie object", {
  base_data <- generate_base_data(n = 100, p = 50, k = 2, signal_sd = 1.75, seed = 145)
  result <- susie_auto(base_data$X, base_data$y, L_init = 2, L_max = 4, verbose = FALSE)
  # Check required fields
  expect_true("alpha" %in% names(result))
  expect_true("mu" %in% names(result))
  expect_true("mu2" %in% names(result))
  expect_true("V" %in% names(result))
  expect_true("sigma2" %in% names(result))
  expect_true("elbo" %in% names(result))
  expect_true("niter" %in% names(result))
})

test_that("susie_auto PIPs are valid probabilities", {
  base_data <- generate_base_data(n = 100, p = 50, k = 2, signal_sd = 1.75, seed = 146)
  result <- susie_auto(base_data$X, base_data$y, L_init = 2, L_max = 4, verbose = FALSE)
  # PIPs should be between 0 and 1
  pips <- susie_get_pip(result)
  expect_true(all(pips >= 0))
  expect_true(all(pips <= 1))
})

test_that("susie_auto fitted values have correct dimensions", {
  base_data <- generate_base_data(n = 100, p = 50, k = 2, signal_sd = 1.75, seed = 147)
  result <- susie_auto(base_data$X, base_data$y, L_init = 2, L_max = 4, verbose = FALSE)
  # Fitted values should have length n
  expect_equal(length(result$fitted), base_data$n)
  expect_true(all(is.finite(result$fitted)))
})

# (test_that below is truncated by the chunk boundary; its body continues
# past the end of this view)
test_that("susie_auto predictions work correctly", {
  base_data <- generate_base_data(n = 100, p = 50, k = 2, signal_sd = 1.75, seed = 148)
  result <- susie_auto(base_data$X, base_data$y, L_init = 2, L_max = 4, verbose = FALSE)
  # Predictions should work
  pred <- predict(result)
expect_equal(length(pred), base_data$n) expect_true(all(is.finite(pred))) }) test_that("susie_auto coefficients can be extracted", { base_data <- generate_base_data(n = 100, p = 50, k = 2, signal_sd = 1.75, seed = 149) result <- susie_auto(base_data$X, base_data$y, L_init = 2, L_max = 4, verbose = FALSE) # Coefficients should be extractable coefs <- coef(result) expect_equal(length(coefs), base_data$p + 1) # p coefficients + intercept expect_true(all(is.finite(coefs))) }) # ============================================================================= # MATHEMATICAL PROPERTIES # ============================================================================= test_that("susie_auto ELBO is monotonically increasing or stable", { base_data <- generate_base_data(n = 100, p = 50, k = 2, signal_sd = 1.75, seed = 150) result <- susie_auto(base_data$X, base_data$y, L_init = 2, L_max = 4, verbose = FALSE) # ELBO should be non-decreasing (allowing for small numerical errors) elbo_diff <- diff(result$elbo) expect_true(all(elbo_diff > -1e-6)) }) test_that("susie_auto final ELBO is finite", { base_data <- generate_base_data(n = 100, p = 50, k = 2, signal_sd = 1.75, seed = 151) result <- susie_auto(base_data$X, base_data$y, L_init = 2, L_max = 4, verbose = FALSE) final_elbo <- result$elbo[length(result$elbo)] expect_true(is.finite(final_elbo)) expect_false(is.na(final_elbo)) }) test_that("susie_auto alpha rows sum to 1", { base_data <- generate_base_data(n = 100, p = 50, k = 2, signal_sd = 1.75, seed = 152) result <- susie_auto(base_data$X, base_data$y, L_init = 2, L_max = 4, verbose = FALSE) # Each row of alpha should sum to 1 row_sums <- rowSums(result$alpha) expect_true(all(abs(row_sums - 1) < 1e-10)) }) test_that("susie_auto alpha values are valid probabilities", { base_data <- generate_base_data(n = 100, p = 50, k = 2, signal_sd = 1.75, seed = 153) result <- susie_auto(base_data$X, base_data$y, L_init = 2, L_max = 4, verbose = FALSE) # Alpha should be in [0, 1] 
expect_true(all(result$alpha >= 0)) expect_true(all(result$alpha <= 1)) }) test_that("susie_auto KL divergences are non-negative", { base_data <- generate_base_data(n = 100, p = 50, k = 2, signal_sd = 1.75, seed = 154) result <- susie_auto(base_data$X, base_data$y, L_init = 2, L_max = 4, verbose = FALSE) # KL divergences should be non-negative expect_true(all(result$KL >= -1e-10)) # Allow small numerical error }) # ============================================================================= # SIGNAL RECOVERY # ============================================================================= test_that("susie_auto recovers true causal variables with strong signal", { base_data <- generate_base_data(n = 200, p = 100, k = 3, signal_sd = 1.5, seed = 155) base_data$X <- scale(base_data$X) # Set specific effect sizes base_data$beta[base_data$causal_idx] <- c(1.5, -1.2, 1.8) base_data$y <- as.vector(base_data$X %*% base_data$beta + rnorm(base_data$n, sd = 0.5)) result <- susie_auto(base_data$X, base_data$y, L_init = 1, L_max = 10, verbose = FALSE) # Get PIPs pips <- susie_get_pip(result) # Top PIPs should include causal variables top_vars <- order(pips, decreasing = TRUE)[1:5] expect_true(length(intersect(top_vars, base_data$causal_idx)) >= 2) }) test_that("susie_auto has low PIPs for null variables", { base_data <- generate_base_data(n = 200, p = 100, k = 2, signal_sd = 1.9, seed = 156) base_data$X <- scale(base_data$X) base_data$y <- as.vector(base_data$X %*% base_data$beta + rnorm(base_data$n, sd = 0.5)) result <- susie_auto(base_data$X, base_data$y, L_init = 1, L_max = 10, verbose = FALSE) # Get PIPs pips <- susie_get_pip(result) # Most PIPs should be low for null variables null_pips <- pips[setdiff(1:base_data$p, base_data$causal_idx)] expect_true(median(null_pips) < 0.2) }) test_that("susie_auto identifies credible sets for strong effects", { base_data <- generate_base_data(n = 200, p = 100, k = 3, signal_sd = 2, seed = 157) base_data$X <- scale(base_data$X) base_data$y 
<- as.vector(base_data$X %*% base_data$beta + rnorm(base_data$n, sd = 0.5)) result <- susie_auto(base_data$X, base_data$y, L_init = 1, L_max = 10, verbose = FALSE) # Should find credible sets cs <- susie_get_cs(result) if (!is.null(cs) && length(cs$cs) > 0) { # At least one CS should be found expect_true(length(cs$cs) >= 1) # CSs should have reasonable coverage expect_true(all(cs$coverage >= 0.9)) } }) # ============================================================================= # VERBOSE OUTPUT # ============================================================================= test_that("susie_auto verbose mode produces output", { base_data <- generate_base_data(n = 100, p = 50, k = 2, signal_sd = 1.75, seed = 158) # Capture messages expect_message( susie_auto(base_data$X, base_data$y, L_init = 1, L_max = 4, verbose = TRUE), "Trying L=" ) }) test_that("susie_auto verbose shows correct L progression", { base_data <- generate_base_data(n = 100, p = 50, k = 5, signal_sd = 1, seed = 159) # Capture messages and check for L progression msgs <- capture_messages( susie_auto(base_data$X, base_data$y, L_init = 1, L_max = 4, verbose = TRUE) ) # Should see "Trying L=" messages expect_true(any(grepl("Trying L=", msgs))) }) # ============================================================================= # CONSISTENCY # ============================================================================= test_that("susie_auto gives consistent results with same seed", { base_data <- generate_base_data(n = 100, p = 50, k = 2, signal_sd = 1.75, seed = 199) set.seed(200) result1 <- susie_auto(base_data$X, base_data$y, L_init = 2, L_max = 4, verbose = FALSE) set.seed(200) result2 <- susie_auto(base_data$X, base_data$y, L_init = 2, L_max = 4, verbose = FALSE) # Results should be identical expect_equal(result1$alpha, result2$alpha) expect_equal(result1$elbo, result2$elbo) }) test_that("susie_auto with different L_init converges to similar solutions", { base_data <- generate_base_data(n = 100, p = 
50, k = 2, signal_sd = 1.75, seed = 201) result_L1 <- susie_auto(base_data$X, base_data$y, L_init = 1, L_max = 8, verbose = FALSE) result_L2 <- susie_auto(base_data$X, base_data$y, L_init = 2, L_max = 8, verbose = FALSE) # PIPs should be similar pips1 <- susie_get_pip(result_L1) pips2 <- susie_get_pip(result_L2) # Correlation of PIPs should be high expect_true(cor(pips1, pips2) > 0.9) }) ================================================ FILE: tests/testthat/test_susie_constructors.R ================================================ context("SuSiE Data Constructors") # ============================================================================= # INDIVIDUAL DATA CONSTRUCTOR - Basic Functionality # ============================================================================= test_that("individual_data_constructor returns correct structure", { base_data <- generate_base_data(n = 100, p = 50, k = 0, seed = 1) result <- individual_data_constructor(base_data$X, base_data$y) expect_type(result, "list") expect_true("data" %in% names(result)) expect_true("params" %in% names(result)) expect_s3_class(result$data, "individual") }) test_that("individual_data_constructor creates data object with correct fields", { base_data <- generate_base_data(n = 100, p = 50, k = 0, seed = 2) result <- individual_data_constructor(base_data$X, base_data$y) expect_true("X" %in% names(result$data)) expect_true("y" %in% names(result$data)) expect_true("n" %in% names(result$data)) expect_true("p" %in% names(result$data)) expect_true("mean_y" %in% names(result$data)) }) test_that("individual_data_constructor sets correct dimensions", { base_data <- generate_base_data(n = 100, p = 50, k = 0, seed = 3) result <- individual_data_constructor(base_data$X, base_data$y) expect_equal(result$data$n, base_data$n) expect_equal(result$data$p, base_data$p) expect_equal(dim(result$data$X), c(base_data$n, base_data$p)) expect_length(result$data$y, base_data$n) }) test_that("individual_data_constructor sets X 
attributes", { base_data <- generate_base_data(n = 100, p = 50, k = 0, seed = 4) result <- individual_data_constructor(base_data$X, base_data$y, standardize = TRUE, intercept = TRUE) expect_true(!is.null(attr(result$data$X, "scaled:center"))) expect_true(!is.null(attr(result$data$X, "scaled:scale"))) expect_true(!is.null(attr(result$data$X, "d"))) }) # ============================================================================= # INDIVIDUAL DATA CONSTRUCTOR - Input Validation # ============================================================================= test_that("individual_data_constructor rejects non-matrix X", { expect_error( individual_data_constructor(as.data.frame(matrix(1:10, 5, 2)), rnorm(5)), "Input X must be a double-precision matrix" ) }) test_that("individual_data_constructor rejects X with NAs", { base_data <- generate_base_data(n = 10, p = 10, k = 0, seed = 5) base_data$X[5, 5] <- NA expect_error( individual_data_constructor(base_data$X, base_data$y), "X contains NA values" ) }) test_that("individual_data_constructor rejects y with NAs when na.rm=FALSE", { base_data <- generate_base_data(n = 10, p = 10, k = 0, seed = 6) base_data$y[5] <- NA expect_error( individual_data_constructor(base_data$X, base_data$y, na.rm = FALSE), "Input y must not contain missing values" ) }) test_that("individual_data_constructor handles y with NAs when na.rm=TRUE", { base_data <- generate_base_data(n = 10, p = 10, k = 0, seed = 7) base_data$y[5] <- NA result <- individual_data_constructor(base_data$X, base_data$y, na.rm = TRUE) expect_equal(result$data$n, 9) expect_equal(nrow(result$data$X), 9) expect_length(result$data$y, 9) expect_false(anyNA(result$data$y)) }) test_that("individual_data_constructor computes residual_variance_lowerbound after NA removal", { base_data <- generate_base_data(n = 100, p = 10, k = 0, seed = 7.25) base_data$y[1] <- NA result <- individual_data_constructor(base_data$X, base_data$y, na.rm = TRUE) # Verify residual_variance_lowerbound is 
computed correctly (not NA) expect_true(is.finite(result$params$residual_variance_lowerbound)) expect_true(result$params$residual_variance_lowerbound > 0) # Verify it equals var(y_clean) / 1e4 where y_clean has NA removed y_clean <- base_data$y[!is.na(base_data$y)] expected_lowerbound <- var(y_clean) / 1e4 expect_equal(result$params$residual_variance_lowerbound, expected_lowerbound) }) test_that("individual_data_constructor allows custom residual_variance_lowerbound with NA in y", { base_data <- generate_base_data(n = 100, p = 10, k = 0, seed = 7.5) base_data$y[1] <- NA custom_lowerbound <- 0.001 result <- individual_data_constructor( base_data$X, base_data$y, na.rm = TRUE, residual_variance_lowerbound = custom_lowerbound ) expect_equal(result$params$residual_variance_lowerbound, custom_lowerbound) }) test_that("individual_data_constructor handles multiple NAs in y with na.rm=TRUE", { base_data <- generate_base_data(n = 100, p = 10, k = 0, seed = 7.75) # Set multiple NAs at different positions base_data$y[c(1, 25, 50, 75, 100)] <- NA result <- individual_data_constructor(base_data$X, base_data$y, na.rm = TRUE) expect_equal(result$data$n, 95) expect_equal(nrow(result$data$X), 95) expect_length(result$data$y, 95) expect_false(anyNA(result$data$y)) expect_true(is.finite(result$params$residual_variance_lowerbound)) }) # ============================================================================= # INDIVIDUAL DATA CONSTRUCTOR - Centering and Scaling # ============================================================================= test_that("individual_data_constructor centers y when intercept=TRUE", { base_data <- generate_base_data(n = 100, p = 50, k = 0, seed = 8) base_data$y <- base_data$y + 10 result <- individual_data_constructor(base_data$X, base_data$y, intercept = TRUE) expect_equal(mean(result$data$y), 0, tolerance = 1e-10) expect_true(result$data$mean_y != 0) }) test_that("individual_data_constructor does not center y when intercept=FALSE", { base_data <- 
generate_base_data(n = 100, p = 50, k = 0, seed = 9) base_data$y <- base_data$y + 10 result <- individual_data_constructor(base_data$X, base_data$y, intercept = FALSE) expect_true(abs(mean(result$data$y) - 10) < 1) }) test_that("individual_data_constructor standardizes X when requested", { set.seed(10) base_data <- generate_base_data(n = 100, p = 50, k = 0, seed = NULL) # Create X with different mean and sd base_data$X <- matrix(rnorm(base_data$n * base_data$p, mean = 5, sd = 3), base_data$n, base_data$p) result <- individual_data_constructor(base_data$X, base_data$y, standardize = TRUE, intercept = TRUE) cm <- attr(result$data$X, "scaled:center") csd <- attr(result$data$X, "scaled:scale") expect_length(cm, base_data$p) expect_length(csd, base_data$p) expect_true(all(csd > 0)) }) # ============================================================================= # INDIVIDUAL DATA CONSTRUCTOR - Prior Weights # ============================================================================= test_that("individual_data_constructor creates uniform prior weights by default", { base_data <- generate_base_data(n = 100, p = 50, k = 0, seed = 11) result <- individual_data_constructor(base_data$X, base_data$y) expect_length(result$params$prior_weights, base_data$p) expect_equal(sum(result$params$prior_weights), 1, tolerance = 1e-10) expect_true(all(abs(result$params$prior_weights - 1/base_data$p) < 1e-10)) }) test_that("individual_data_constructor normalizes custom prior weights", { base_data <- generate_base_data(n = 100, p = 50, k = 0, seed = 12) custom_weights <- rep(2, base_data$p) result <- individual_data_constructor(base_data$X, base_data$y, prior_weights = custom_weights) expect_equal(sum(result$params$prior_weights), 1, tolerance = 1e-10) }) test_that("individual_data_constructor rejects wrong length prior weights", { base_data <- generate_base_data(n = 100, p = 50, k = 0, seed = 13) expect_error( individual_data_constructor(base_data$X, base_data$y, prior_weights = rep(1, 
40)), "Prior weights must have length p" ) }) test_that("individual_data_constructor rejects all-zero prior weights", { base_data <- generate_base_data(n = 100, p = 50, k = 0, seed = 14) expect_error( individual_data_constructor(base_data$X, base_data$y, prior_weights = rep(0, base_data$p)), "Prior weight should be greater than 0" ) }) # ============================================================================= # INDIVIDUAL DATA CONSTRUCTOR - Null Weight # ============================================================================= test_that("individual_data_constructor handles null_weight=0", { base_data <- generate_base_data(n = 100, p = 50, k = 0, seed = 15) result <- individual_data_constructor(base_data$X, base_data$y, null_weight = 0) expect_equal(result$data$p, base_data$p) expect_equal(ncol(result$data$X), base_data$p) expect_null(result$params$null_weight) }) test_that("individual_data_constructor adds null column when null_weight > 0", { base_data <- generate_base_data(n = 100, p = 50, k = 0, seed = 16) result <- individual_data_constructor(base_data$X, base_data$y, null_weight = 0.1) expect_equal(result$data$p, base_data$p + 1) expect_equal(ncol(result$data$X), base_data$p + 1) expect_equal(result$params$null_weight, 0.1) expect_true(all(result$data$X[, base_data$p + 1] == 0)) }) test_that("individual_data_constructor adjusts prior weights with null_weight", { base_data <- generate_base_data(n = 100, p = 50, k = 0, seed = 17) result <- individual_data_constructor(base_data$X, base_data$y, null_weight = 0.2) expect_length(result$params$prior_weights, base_data$p + 1) expect_equal(sum(result$params$prior_weights), 1, tolerance = 1e-10) expect_equal(result$params$prior_weights[base_data$p + 1], 0.2, tolerance = 1e-10) }) test_that("individual_data_constructor adjusts custom prior weights with null_weight", { base_data <- generate_base_data(n = 100, p = 50, k = 0, seed = 17.5) # Create custom prior weights (not uniform) custom_weights <- 
runif(base_data$p, 0.5, 2) custom_weights <- custom_weights / sum(custom_weights) # Normalize to sum to 1 result <- individual_data_constructor(base_data$X, base_data$y, prior_weights = custom_weights, null_weight = 0.3) # Check that we have p+1 weights (original p + null column) expect_length(result$params$prior_weights, base_data$p + 1) # Check that all weights sum to 1 expect_equal(sum(result$params$prior_weights), 1, tolerance = 1e-10) # Check that the null weight is exactly 0.3 expect_equal(result$params$prior_weights[base_data$p + 1], 0.3, tolerance = 1e-10) # Check that the other weights were scaled by (1 - null_weight) = 0.7 # i.e., result$params$prior_weights[1:p] should equal custom_weights * 0.7 expect_equal(result$params$prior_weights[1:base_data$p], custom_weights * 0.7, tolerance = 1e-10) # Verify that the sum of the first p weights is (1 - 0.3) = 0.7 expect_equal(sum(result$params$prior_weights[1:base_data$p]), 0.7, tolerance = 1e-10) }) test_that("individual_data_constructor rejects invalid null_weight", { base_data <- generate_base_data(n = 100, p = 50, k = 0, seed = 18) expect_error( individual_data_constructor(base_data$X, base_data$y, null_weight = -0.1), "Null weight must be between 0 and 1" ) expect_error( individual_data_constructor(base_data$X, base_data$y, null_weight = 1.5), "Null weight must be between 0 and 1" ) expect_error( individual_data_constructor(base_data$X, base_data$y, null_weight = "invalid"), "Null weight must be numeric" ) }) # ============================================================================= # INDIVIDUAL DATA CONSTRUCTOR - Rfast Warning # ============================================================================= test_that("individual_data_constructor warns about Rfast when p > 1000 and Rfast not available", { # Only test the warning if Rfast is not installed skip_if(requireNamespace("Rfast", quietly = TRUE), "Rfast is installed, skipping warning test") base_data <- generate_base_data(n = 100, p = 1001, k = 0, 
seed = 18.5) expect_message( result <- individual_data_constructor(base_data$X, base_data$y), "consider installing the Rfast package", fixed = FALSE ) # Verify constructor still works despite the warning expect_equal(result$data$p, 1001) }) test_that("individual_data_constructor does not warn when p <= 1000", { # This should never warn regardless of Rfast availability base_data <- generate_base_data(n = 100, p = 1000, k = 0, seed = 18.75) result <- individual_data_constructor(base_data$X, base_data$y) expect_equal(result$data$p, 1000) }) # ============================================================================= # INDIVIDUAL DATA CONSTRUCTOR - Parameters # ============================================================================= test_that("individual_data_constructor stores all parameters", { base_data <- generate_base_data(n = 100, p = 50, k = 0, seed = 19) result <- individual_data_constructor( base_data$X, base_data$y, L = 5, estimate_residual_variance = TRUE, estimate_prior_variance = TRUE, max_iter = 50, tol = 1e-4 ) expect_equal(result$params$L, 5) expect_true(result$params$estimate_residual_variance) expect_true(result$params$estimate_prior_variance) expect_equal(result$params$max_iter, 50) expect_equal(result$params$tol, 1e-4) }) # ============================================================================= # INDIVIDUAL DATA CONSTRUCTOR - Incompatible Parameter Combinations # ============================================================================= test_that("individual_data_constructor rejects unmappable_effects with NIG", { base_data <- generate_base_data(n = 100, p = 50, k = 0, seed = 19.5) expect_error( individual_data_constructor( base_data$X, base_data$y, unmappable_effects = "inf", estimate_residual_method = "NIG" ), "The combination of unmappable_effects = 'inf' with estimate_residual_method = 'NIG' is not supported" ) expect_error( individual_data_constructor( base_data$X, base_data$y, unmappable_effects = "ash", 
estimate_residual_method = "NIG" ), "The combination of unmappable_effects = 'ash' with estimate_residual_method = 'NIG' is not supported" ) }) test_that("individual_data_constructor rejects unmappable_effects='ash' with estimate_prior_method='EM'", { base_data <- generate_base_data(n = 100, p = 50, k = 0, seed = 19.75) expect_error( individual_data_constructor( base_data$X, base_data$y, unmappable_effects = "ash", estimate_prior_method = "EM" ), "The combination of unmappable_effects = 'ash' with estimate_prior_method = 'EM' is not supported" ) }) # ============================================================================= # SUFFICIENT STATISTICS CONSTRUCTOR - Basic Functionality # ============================================================================= test_that("sufficient_stats_constructor returns correct structure", { base_data <- generate_base_data(n = 100, p = 50, k = 0, seed = 20) XtX <- crossprod(base_data$X) Xty <- crossprod(base_data$X, base_data$y) yty <- sum(base_data$y^2) result <- sufficient_stats_constructor(Xty = Xty, yty = yty, n = base_data$n, XtX = XtX) expect_type(result, "list") expect_true("data" %in% names(result)) expect_true("params" %in% names(result)) expect_s3_class(result$data, "ss") }) test_that("sufficient_stats_constructor creates data object with correct fields", { base_data <- generate_base_data(n = 100, p = 50, k = 0, seed = 21) XtX <- crossprod(base_data$X) Xty <- crossprod(base_data$X, base_data$y) yty <- sum(base_data$y^2) result <- sufficient_stats_constructor(Xty = Xty, yty = yty, n = base_data$n, XtX = XtX) expect_true("XtX" %in% names(result$data)) expect_true("Xty" %in% names(result$data)) expect_true("yty" %in% names(result$data)) expect_true("n" %in% names(result$data)) expect_true("p" %in% names(result$data)) }) test_that("sufficient_stats_constructor sets correct dimensions", { base_data <- generate_base_data(n = 100, p = 50, k = 0, seed = 22) XtX <- crossprod(base_data$X) Xty <- crossprod(base_data$X, 
base_data$y) yty <- sum(base_data$y^2) result <- sufficient_stats_constructor(Xty = Xty, yty = yty, n = base_data$n, XtX = XtX) expect_equal(result$data$n, base_data$n) expect_equal(result$data$p, base_data$p) expect_equal(dim(result$data$XtX), c(base_data$p, base_data$p)) expect_length(result$data$Xty, base_data$p) }) # ============================================================================= # SUFFICIENT STATISTICS CONSTRUCTOR - Input Validation # ============================================================================= test_that("sufficient_stats_constructor requires n", { XtX <- matrix(1:25, 5, 5) Xty <- 1:5 yty <- 10 expect_error( sufficient_stats_constructor(Xty = Xty, yty = yty, XtX = XtX), "n must be provided" ) }) test_that("sufficient_stats_constructor rejects n <= 1", { XtX <- matrix(1:25, 5, 5) Xty <- 1:5 yty <- 10 expect_error( sufficient_stats_constructor(Xty = Xty, yty = yty, n = 1, XtX = XtX), "n must be greater than 1" ) }) test_that("sufficient_stats_constructor requires all inputs", { XtX <- matrix(1:25, 5, 5) Xty <- 1:5 yty <- 10 n <- 100 expect_error( sufficient_stats_constructor(Xty = Xty, yty = yty, n = n), "XtX, Xty, yty must all be provided" ) }) test_that("sufficient_stats_constructor rejects non-matrix XtX", { # Test with data.frame (not a matrix) XtX_df <- data.frame(matrix(rnorm(25), 5, 5)) Xty <- rnorm(5) yty <- 10 n <- 100 expect_error( sufficient_stats_constructor(Xty = Xty, yty = yty, n = n, XtX = XtX_df), "XtX must be a numeric dense or sparse matrix" ) }) test_that("sufficient_stats_constructor rejects integer matrix XtX", { # Test with integer matrix (not double) XtX_int <- matrix(1L:25L, 5, 5) Xty <- 1:5 yty <- 10 n <- 100 expect_error( sufficient_stats_constructor(Xty = Xty, yty = yty, n = n, XtX = XtX_int), "XtX must be a numeric dense or sparse matrix" ) }) test_that("sufficient_stats_constructor rejects non-numeric XtX", { # Test with character matrix XtX_char <- matrix(as.character(1:25), 5, 5) Xty <- 1:5 yty <- 10 
n <- 100 expect_error( sufficient_stats_constructor(Xty = Xty, yty = yty, n = n, XtX = XtX_char), "XtX must be a numeric dense or sparse matrix" ) }) test_that("sufficient_stats_constructor rejects vector XtX", { # Test with vector (not a matrix) XtX_vec <- rnorm(25) Xty <- 1:5 yty <- 10 n <- 100 expect_error( sufficient_stats_constructor(Xty = Xty, yty = yty, n = n, XtX = XtX_vec), "XtX must be a numeric dense or sparse matrix" ) }) test_that("sufficient_stats_constructor rejects dimension mismatch", { base_data <- generate_base_data(n = 100, p = 5, k = 0, seed = 23) XtX <- crossprod(base_data$X) Xty <- rnorm(10) yty <- 100 expect_error( sufficient_stats_constructor(Xty = Xty, yty = yty, n = base_data$n, XtX = XtX), "does not agree with expected" ) }) test_that("sufficient_stats_constructor rejects non-symmetric XtX", { XtX <- matrix(1:25, 5, 5) XtX[1, 2] <- 100 Xty <- 1:5 yty <- 10 n <- 100 expect_message( result <- sufficient_stats_constructor(Xty = Xty, yty = yty, n = n, XtX = XtX), "XtX not symmetric" ) expect_true(isSymmetric(result$data$XtX)) }) test_that("sufficient_stats_constructor rejects XtX with NAs", { XtX <- matrix(rnorm(25), 5, 5) XtX[1, 1] <- NA Xty <- 1:5 yty <- 10 n <- 100 expect_error( sufficient_stats_constructor(Xty = Xty, yty = yty, n = n, XtX = XtX), "Input XtX matrix contains NAs" ) }) test_that("sufficient_stats_constructor handles Xty with NAs", { base_data <- generate_base_data(n = 100, p = 10, k = 0, seed = 24) XtX <- crossprod(base_data$X) Xty <- rnorm(base_data$p) Xty[5] <- NA yty <- 100 expect_message( result <- sufficient_stats_constructor(Xty = Xty, yty = yty, n = base_data$n, XtX = XtX), "NA values in Xty are replaced with 0" ) expect_false(anyNA(result$data$Xty)) expect_equal(result$data$Xty[5], 0) }) test_that("sufficient_stats_constructor rejects infinite Xty", { XtX <- crossprod(matrix(rnorm(100 * 10), 100, 10)) Xty <- rnorm(10) Xty[5] <- Inf yty <- 100 n <- 100 expect_error( sufficient_stats_constructor(Xty = Xty, yty = yty, 
n = n, XtX = XtX), "Input Xty contains infinite values" ) }) # ============================================================================= # SUFFICIENT STATISTICS CONSTRUCTOR - Standardization # ============================================================================= test_that("sufficient_stats_constructor standardizes when requested", { set.seed(25) base_data <- generate_base_data(n = 100, p = 50, k = 0, seed = NULL) base_data$X <- matrix(rnorm(base_data$n * base_data$p, mean = 5, sd = 3), base_data$n, base_data$p) XtX <- crossprod(base_data$X) Xty <- crossprod(base_data$X, base_data$y) yty <- sum(base_data$y^2) result <- sufficient_stats_constructor(Xty = Xty, yty = yty, n = base_data$n, XtX = XtX, standardize = TRUE) d_attr <- attr(result$data$XtX, "d") expect_length(d_attr, base_data$p) expect_true(all(is.finite(d_attr))) }) test_that("sufficient_stats_constructor does not standardize when standardize=FALSE", { base_data <- generate_base_data(n = 100, p = 50, k = 0, seed = 26) XtX <- crossprod(base_data$X) Xty <- crossprod(base_data$X, base_data$y) yty <- sum(base_data$y^2) result <- sufficient_stats_constructor(Xty = Xty, yty = yty, n = base_data$n, XtX = XtX, standardize = FALSE) csd_attr <- attr(result$data$XtX, "scaled:scale") expect_true(all(csd_attr == 1)) }) # ============================================================================= # SUFFICIENT STATISTICS CONSTRUCTOR - Rfast Warning # ============================================================================= test_that("sufficient_stats_constructor warns about Rfast when p > 1000 and Rfast not available", { # Only test the warning if Rfast is not installed skip_if(requireNamespace("Rfast", quietly = TRUE), "Rfast is installed, skipping warning test") base_data <- generate_base_data(n = 100, p = 1001, k = 0, seed = 27.5) XtX <- crossprod(base_data$X) Xty <- crossprod(base_data$X, base_data$y) yty <- sum(base_data$y^2) expect_message( result <- sufficient_stats_constructor(Xty = Xty, yty = 
yty, n = base_data$n, XtX = XtX), "consider installing the Rfast package", fixed = FALSE ) # Verify constructor still works despite the warning expect_equal(result$data$p, 1001) }) test_that("sufficient_stats_constructor does not warn when p <= 1000", { # This should never warn regardless of Rfast availability base_data <- generate_base_data(n = 100, p = 1000, k = 0, seed = 27.6) XtX <- crossprod(base_data$X) Xty <- crossprod(base_data$X, base_data$y) yty <- sum(base_data$y^2) result <- sufficient_stats_constructor(Xty = Xty, yty = yty, n = base_data$n, XtX = XtX) # Just verify it worked expect_equal(result$data$p, 1000) }) # ============================================================================= # SUFFICIENT STATISTICS CONSTRUCTOR - MAF Filtering # ============================================================================= test_that("sufficient_stats_constructor applies MAF filter", { base_data <- generate_base_data(n = 100, p = 50, k = 0, seed = 27) XtX <- crossprod(base_data$X) Xty <- crossprod(base_data$X, base_data$y) yty <- sum(base_data$y^2) maf <- runif(base_data$p, 0, 0.5) result <- sufficient_stats_constructor( Xty = Xty, yty = yty, n = base_data$n, XtX = XtX, maf = maf, maf_thresh = 0.1 ) n_filtered <- sum(maf > 0.1) expect_equal(result$data$p, n_filtered) expect_equal(nrow(result$data$XtX), n_filtered) expect_length(result$data$Xty, n_filtered) }) test_that("sufficient_stats_constructor rejects MAF with incorrect length", { base_data <- generate_base_data(n = 100, p = 50, k = 0, seed = 27.7) XtX <- crossprod(base_data$X) Xty <- crossprod(base_data$X, base_data$y) yty <- sum(base_data$y^2) # MAF vector with wrong length (p - 10 instead of p) maf_wrong_length <- runif(base_data$p - 10, 0, 0.5) expect_error( sufficient_stats_constructor( Xty = Xty, yty = yty, n = base_data$n, XtX = XtX, maf = maf_wrong_length, maf_thresh = 0.1 ), "The length of maf does not agree with expected" ) }) test_that("sufficient_stats_constructor rejects MAF that is too 
long", { base_data <- generate_base_data(n = 100, p = 50, k = 0, seed = 27.8) XtX <- crossprod(base_data$X) Xty <- crossprod(base_data$X, base_data$y) yty <- sum(base_data$y^2) # MAF vector with wrong length (p + 10 instead of p) maf_too_long <- runif(base_data$p + 10, 0, 0.5) expect_error( sufficient_stats_constructor( Xty = Xty, yty = yty, n = base_data$n, XtX = XtX, maf = maf_too_long, maf_thresh = 0.1 ), "The length of maf does not agree with expected" ) }) # ============================================================================= # SUFFICIENT STATISTICS CONSTRUCTOR - Positive Semidefinite Check # ============================================================================= test_that("sufficient_stats_constructor rejects non-positive-semidefinite XtX when check_input=TRUE", { # Create a matrix that is NOT positive semidefinite # by using a matrix with negative eigenvalues base_data <- generate_base_data(n = 100, p = 5, k = 0, seed = 28.9) XtX <- crossprod(base_data$X) Xty <- crossprod(base_data$X, base_data$y) yty <- sum(base_data$y^2) # Make XtX non-positive-semidefinite by adding a negative diagonal # This creates negative eigenvalues XtX[1, 1] <- -10 expect_error( sufficient_stats_constructor( Xty = Xty, yty = yty, n = base_data$n, XtX = XtX, check_input = TRUE ), "XtX is not a positive semidefinite matrix" ) }) test_that("sufficient_stats_constructor accepts positive-semidefinite XtX when check_input=TRUE", { # Create a valid positive semidefinite matrix base_data <- generate_base_data(n = 100, p = 5, k = 0, seed = 29) XtX <- crossprod(base_data$X) Xty <- crossprod(base_data$X, base_data$y) yty <- sum(base_data$y^2) # This should work without error result <- sufficient_stats_constructor( Xty = Xty, yty = yty, n = base_data$n, XtX = XtX, check_input = TRUE ) expect_equal(result$data$p, base_data$p) }) test_that("sufficient_stats_constructor warns when Xty not in column space of XtX", { # Create a rank-deficient matrix with exact zero eigenvalues p <- 5 
n <- 100 # Diagonal matrix with rank 3 (2 zero eigenvalues) XtX <- diag(c(1, 1, 1, 0, 0)) # Create Xty with non-zero components in the null space (positions 4 and 5) # This Xty cannot be written as X'y for any y Xty <- c(1, 1, 1, 10, 10) # Last two components are in null space yty <- 100 expect_message( result <- sufficient_stats_constructor( Xty = Xty, yty = yty, n = n, XtX = XtX, check_input = TRUE ), "Xty does not lie in the space of the non-zero eigenvectors" ) }) test_that("sufficient_stats_constructor does not warn when Xty in column space", { # Create valid XtX and Xty from same data base_data <- generate_base_data(n = 100, p = 5, k = 0, seed = 29.3) XtX <- crossprod(base_data$X) Xty <- crossprod(base_data$X, base_data$y) yty <- sum(base_data$y^2) # This should work without warning since Xty = X'y by construction result <- sufficient_stats_constructor( Xty = Xty, yty = yty, n = base_data$n, XtX = XtX, check_input = TRUE ) # Just verify it worked expect_equal(result$data$p, base_data$p) }) # ============================================================================= # SUFFICIENT STATISTICS CONSTRUCTOR - Null Weight # ============================================================================= test_that("sufficient_stats_constructor adds null column when null_weight > 0", { base_data <- generate_base_data(n = 100, p = 50, k = 0, seed = 28) XtX <- crossprod(base_data$X) Xty <- crossprod(base_data$X, base_data$y) yty <- sum(base_data$y^2) result <- sufficient_stats_constructor( Xty = Xty, yty = yty, n = base_data$n, XtX = XtX, null_weight = 0.1, X_colmeans = rep(0, base_data$p) ) expect_equal(result$data$p, base_data$p + 1) expect_equal(nrow(result$data$XtX), base_data$p + 1) expect_length(result$data$Xty, base_data$p + 1) expect_equal(result$params$null_weight, 0.1) }) test_that("sufficient_stats_constructor adjusts custom prior weights with null_weight", { base_data <- generate_base_data(n = 100, p = 50, k = 0, seed = 28.5) XtX <- crossprod(base_data$X) Xty 
<- crossprod(base_data$X, base_data$y) yty <- sum(base_data$y^2) # Create custom prior weights (not uniform) custom_weights <- runif(base_data$p, 0.5, 2) custom_weights <- custom_weights / sum(custom_weights) # Normalize to sum to 1 result <- sufficient_stats_constructor( Xty = Xty, yty = yty, n = base_data$n, XtX = XtX, prior_weights = custom_weights, null_weight = 0.25, X_colmeans = rep(0, base_data$p) ) # Check that we have p+1 weights (original p + null column) expect_length(result$params$prior_weights, base_data$p + 1) # Check that all weights sum to 1 expect_equal(sum(result$params$prior_weights), 1, tolerance = 1e-10) # Check that the null weight is exactly 0.25 expect_equal(result$params$prior_weights[base_data$p + 1], 0.25, tolerance = 1e-10) # Check that the other weights were scaled by (1 - null_weight) = 0.75 expect_equal(result$params$prior_weights[1:base_data$p], custom_weights * 0.75, tolerance = 1e-10) # Verify that the sum of the first p weights is (1 - 0.25) = 0.75 expect_equal(sum(result$params$prior_weights[1:base_data$p]), 0.75, tolerance = 1e-10) }) test_that("sufficient_stats_constructor rejects non-numeric null_weight", { base_data <- generate_base_data(n = 100, p = 50, k = 0, seed = 28.6) XtX <- crossprod(base_data$X) Xty <- crossprod(base_data$X, base_data$y) yty <- sum(base_data$y^2) expect_error( sufficient_stats_constructor( Xty = Xty, yty = yty, n = base_data$n, XtX = XtX, null_weight = "invalid" ), "Null weight must be numeric" ) }) test_that("sufficient_stats_constructor rejects negative null_weight", { base_data <- generate_base_data(n = 100, p = 50, k = 0, seed = 28.7) XtX <- crossprod(base_data$X) Xty <- crossprod(base_data$X, base_data$y) yty <- sum(base_data$y^2) expect_error( sufficient_stats_constructor( Xty = Xty, yty = yty, n = base_data$n, XtX = XtX, null_weight = -0.1 ), "Null weight must be between 0 and 1" ) }) test_that("sufficient_stats_constructor rejects null_weight >= 1", { base_data <- generate_base_data(n = 100, p 
= 50, k = 0, seed = 28.8) XtX <- crossprod(base_data$X) Xty <- crossprod(base_data$X, base_data$y) yty <- sum(base_data$y^2) # Test null_weight = 1 expect_error( sufficient_stats_constructor( Xty = Xty, yty = yty, n = base_data$n, XtX = XtX, null_weight = 1 ), "Null weight must be between 0 and 1" ) # Test null_weight > 1 expect_error( sufficient_stats_constructor( Xty = Xty, yty = yty, n = base_data$n, XtX = XtX, null_weight = 1.5 ), "Null weight must be between 0 and 1" ) }) test_that("sufficient_stats_constructor replicates scalar X_colmeans when null_weight is set", { base_data <- generate_base_data(n = 100, p = 50, k = 0, seed = 28.9) XtX <- crossprod(base_data$X) Xty <- crossprod(base_data$X, base_data$y) yty <- sum(base_data$y^2) # Provide scalar X_colmeans which should be replicated to length p result <- sufficient_stats_constructor( Xty = Xty, yty = yty, n = base_data$n, XtX = XtX, null_weight = 0.1, X_colmeans = 0 # Scalar value ) # Should work without error expect_equal(result$data$p, base_data$p + 1) # p + 1 due to null column }) test_that("sufficient_stats_constructor rejects wrong length X_colmeans with null_weight", { base_data <- generate_base_data(n = 100, p = 50, k = 0, seed = 29.0) XtX <- crossprod(base_data$X) Xty <- crossprod(base_data$X, base_data$y) yty <- sum(base_data$y^2) # Provide X_colmeans with wrong length expect_error( sufficient_stats_constructor( Xty = Xty, yty = yty, n = base_data$n, XtX = XtX, null_weight = 0.1, X_colmeans = rep(0, base_data$p - 10) # Wrong length ), "The length of X_colmeans does not agree with number of variables" ) }) test_that("sufficient_stats_constructor replicates scalar X_colmeans without null_weight", { base_data <- generate_base_data(n = 100, p = 50, k = 0, seed = 29.1) XtX <- crossprod(base_data$X) Xty <- crossprod(base_data$X, base_data$y) yty <- sum(base_data$y^2) # Provide scalar X_colmeans which should be replicated to length p result <- sufficient_stats_constructor( Xty = Xty, yty = yty, n = 
base_data$n, XtX = XtX, X_colmeans = 0 # Scalar value ) # Should work without error expect_equal(result$data$p, base_data$p) }) test_that("sufficient_stats_constructor rejects wrong length X_colmeans without null_weight", { base_data <- generate_base_data(n = 100, p = 50, k = 0, seed = 29.2) XtX <- crossprod(base_data$X) Xty <- crossprod(base_data$X, base_data$y) yty <- sum(base_data$y^2) # Provide X_colmeans with wrong length expect_error( sufficient_stats_constructor( Xty = Xty, yty = yty, n = base_data$n, XtX = XtX, X_colmeans = rep(0, base_data$p - 10) # Wrong length ), "X_colmeans.*does not match number of variables" ) }) test_that("sufficient_stats_constructor rejects wrong length prior_weights", { base_data <- generate_base_data(n = 100, p = 50, k = 0, seed = 29.3) XtX <- crossprod(base_data$X) Xty <- crossprod(base_data$X, base_data$y) yty <- sum(base_data$y^2) # Provide prior_weights with wrong length expect_error( sufficient_stats_constructor( Xty = Xty, yty = yty, n = base_data$n, XtX = XtX, prior_weights = rep(1, base_data$p - 10) # Wrong length ), "Prior weights must have length p" ) }) test_that("sufficient_stats_constructor rejects all-zero prior_weights", { base_data <- generate_base_data(n = 100, p = 50, k = 0, seed = 29.4) XtX <- crossprod(base_data$X) Xty <- crossprod(base_data$X, base_data$y) yty <- sum(base_data$y^2) # Provide all-zero prior_weights expect_error( sufficient_stats_constructor( Xty = Xty, yty = yty, n = base_data$n, XtX = XtX, prior_weights = rep(0, base_data$p) # All zeros ), "Prior weight should be greater than 0 for at least one variable" ) }) # ============================================================================= # SUFFICIENT STATISTICS CONSTRUCTOR - Method Restrictions # ============================================================================= test_that("sufficient_stats_constructor accepts NIG", { base_data <- generate_base_data(n = 100, p = 10, k = 0, seed = 29) XtX <- crossprod(base_data$X) Xty <- 
crossprod(base_data$X, base_data$y) yty <- 100 result <- sufficient_stats_constructor(Xty = Xty, yty = yty, n = base_data$n, XtX = XtX, estimate_residual_method = "NIG") expect_true(result$params$use_NIG) expect_equal(result$params$estimate_prior_method, "EM") }) test_that("sufficient_stats_constructor accepts unmappable_effects='ash'", { base_data <- generate_base_data(n = 100, p = 10, k = 0, seed = 30) XtX <- crossprod(base_data$X) Xty <- crossprod(base_data$X, base_data$y) yty <- 100 # ash is now supported for sufficient statistics via mr.ash.rss result <- sufficient_stats_constructor(Xty = Xty, yty = yty, n = base_data$n, XtX = XtX, unmappable_effects = "ash") expect_true(inherits(result$data, "ss")) expect_equal(result$params$unmappable_effects, "ash") }) # ============================================================================= # RSS LAMBDA CONSTRUCTOR - Basic Functionality # ============================================================================= test_that("rss_lambda_constructor returns correct structure", { p <- 50 z <- rnorm(p) R <- diag(p) result <- rss_lambda_constructor(z, R, lambda = 0.5) expect_type(result, "list") expect_true("data" %in% names(result)) expect_true("params" %in% names(result)) expect_s3_class(result$data, "rss_lambda") }) test_that("rss_lambda_constructor creates data object with correct fields", { p <- 50 z <- rnorm(p) R <- diag(p) result <- rss_lambda_constructor(z, R, lambda = 0.5) expect_true("z" %in% names(result$data)) expect_true("R" %in% names(result$data)) expect_true("lambda" %in% names(result$data)) expect_true("eigen_R" %in% names(result$data)) expect_true("Vtz" %in% names(result$data)) expect_true("n" %in% names(result$data)) expect_true("p" %in% names(result$data)) }) test_that("rss_lambda_constructor stores n and dimensions correctly", { p <- 50 z <- rnorm(p) R <- diag(p) # When n is not provided, data$n is NA_integer_ (not silently set to p) result <- rss_lambda_constructor(z, R, lambda = 0.5) 
expect_true(is.na(result$data$n)) expect_equal(result$data$p, p) expect_length(result$data$z, p) expect_equal(dim(result$data$R), c(p, p)) # When n is provided, data$n stores the GWAS sample size as supplied result_n <- rss_lambda_constructor(z, R, lambda = 0.5, n = 1000) expect_equal(result_n$data$n, 1000L) }) test_that("rss_lambda_constructor computes eigen decomposition", { p <- 50 z <- rnorm(p) R <- diag(p) result <- rss_lambda_constructor(z, R, lambda = 0.5) expect_true("eigen_R" %in% names(result$data)) expect_true("values" %in% names(result$data$eigen_R)) expect_true("vectors" %in% names(result$data$eigen_R)) expect_length(result$data$eigen_R$values, p) }) test_that("rss_lambda_constructor computes Vtz", { p <- 50 z <- rnorm(p) R <- diag(p) result <- rss_lambda_constructor(z, R, lambda = 0.5) expect_true("Vtz" %in% names(result$data)) expect_length(result$data$Vtz, p) }) # ============================================================================= # RSS LAMBDA CONSTRUCTOR - Input Validation # ============================================================================= test_that("rss_lambda_constructor rejects dimension mismatch", { z <- rnorm(50) R <- diag(40) expect_error( rss_lambda_constructor(z, R, lambda = 0.5), "does not agree with expected" ) }) test_that("rss_lambda_constructor rejects non-symmetric R", { R <- matrix(rnorm(25), 5, 5) z <- rnorm(5) expect_error( rss_lambda_constructor(z, R, lambda = 0.5), "not a positive semidefinite matrix|R is not a symmetric matrix" ) }) test_that("rss_lambda_constructor accepts R with mismatched rownames and colnames", { p <- 10 z <- rnorm(p) R <- diag(p) rownames(R) <- paste0("row_", 1:p) colnames(R) <- paste0("col_", 1:p) # Should succeed despite mismatched dimnames (values are symmetric) result <- rss_lambda_constructor(z, R, lambda = 0.5) expect_equal(result$data$p, p) expect_s3_class(result$data, "rss_lambda") }) test_that("rss_lambda_constructor accepts R with matching rownames and colnames", { p <- 10 z 
<- rnorm(p) R <- diag(p) rownames(R) <- paste0("SNP", 1:p) colnames(R) <- paste0("SNP", 1:p) result <- rss_lambda_constructor(z, R, lambda = 0.5) expect_equal(result$data$p, p) expect_s3_class(result$data, "rss_lambda") }) test_that("rss_lambda_constructor accepts R with no dimnames", { p <- 10 z <- rnorm(p) R <- diag(p) result <- rss_lambda_constructor(z, R, lambda = 0.5) expect_equal(result$data$p, p) expect_s3_class(result$data, "rss_lambda") }) test_that("rss_lambda_constructor rejects integer matrix R", { R <- matrix(1:25, 5, 5) R <- R + t(R) # Make it symmetric mode(R) <- "integer" # Convert to integer type z <- rnorm(5) expect_error( rss_lambda_constructor(z, R, lambda = 0.5), "Input R must be a double-precision matrix or a sparse matrix" ) }) test_that("rss_lambda_constructor rejects non-positive-semidefinite R when check_R=TRUE", { # Create a matrix with negative eigenvalue R <- diag(5) R[1, 1] <- -1 # Force negative eigenvalue z <- rnorm(5) expect_error( rss_lambda_constructor(z, R, lambda = 0.5, check_R = TRUE), "is not a positive semidefinite matrix" ) }) test_that("rss_lambda_constructor accepts non-PSD R when check_R=FALSE", { # Create a matrix with negative eigenvalue R <- diag(5) R[1, 1] <- -0.5 # Force negative eigenvalue z <- rnorm(5) # Should succeed with check_R = FALSE (sets negative eigenvalues to 0) result <- suppressWarnings( rss_lambda_constructor(z, R, lambda = 0.5, check_R = FALSE) ) expect_true(!is.null(result)) }) test_that("rss_lambda_constructor warns when z not in column space of R", { # Create R with rank < p (has null space) p <- 5 R <- diag(c(1, 1, 1, 0, 0)) # Rank 3, nullspace dimension 2 # Create z with components in null space (positions 4 and 5) z <- c(0.1, 0.1, 0.1, 10, 10) # Large components in null directions expect_message( rss_lambda_constructor(z, R, lambda = 0.5, check_z = TRUE), "Input z does not lie in the space of non-zero eigenvectors of R" ) }) test_that("rss_lambda_constructor messages when z in column space of 
R", { # Create R with rank < p p <- 5 R <- diag(c(1, 1, 1, 0, 0)) # Rank 3 # Create z only in column space (zero components in null directions) z <- c(1, 2, 3, 0, 0) expect_message( suppressWarnings( rss_lambda_constructor(z, R, lambda = 0.5, check_z = TRUE) ), "Input z is in space spanned by the non-zero eigenvectors of R" ) }) test_that("rss_lambda_constructor skips z check when check_z=FALSE", { # Create R with rank < p p <- 5 R <- diag(c(1, 1, 1, 0, 0)) z <- c(0.1, 0.1, 0.1, 10, 10) # z in null space result <- suppressWarnings( suppressMessages( rss_lambda_constructor(z, R, lambda = 0.5, check_z = FALSE) ) ) expect_true(!is.null(result)) }) test_that("rss_lambda_constructor skips z check when R is full rank", { # Full rank R (no null space) p <- 5 R <- diag(p) z <- rnorm(p) # Should not check when length(colspace) == length(z) result <- suppressWarnings( rss_lambda_constructor(z, R, lambda = 0.5, check_z = TRUE) ) expect_true(!is.null(result)) }) test_that("rss_lambda_constructor rejects R with NAs", { R <- diag(10) R[1, 1] <- NA z <- rnorm(10) expect_error( rss_lambda_constructor(z, R, lambda = 0.5), "R matrix contains missing values" ) }) test_that("rss_lambda_constructor rejects infinite z", { R <- diag(10) z <- rnorm(10) z[5] <- Inf expect_error( rss_lambda_constructor(z, R, lambda = 0.5), "z contains infinite values" ) }) test_that("rss_lambda_constructor replaces NA z with zero", { R <- diag(10) z <- rnorm(10) z[5] <- NA expect_message( result <- rss_lambda_constructor(z, R, lambda = 0.5), "NA values in z-scores are replaced with 0" ) expect_false(anyNA(result$data$z)) expect_equal(result$data$z[5], 0) }) # ============================================================================= # RSS LAMBDA CONSTRUCTOR - Lambda Parameter # ============================================================================= test_that("rss_lambda_constructor stores lambda value", { z <- rnorm(50) R <- diag(50) result <- rss_lambda_constructor(z, R, lambda = 0.3) 
expect_equal(result$data$lambda, 0.3) }) test_that("rss_lambda_constructor estimates lambda when lambda='estimate'", { p <- 50 z <- rnorm(p) R <- diag(p) R[1:10, 1:10] <- 0 result <- rss_lambda_constructor(z, R, lambda = "estimate") expect_true(is.numeric(result$data$lambda)) expect_true(result$data$lambda >= 0) }) test_that("rss_lambda_constructor sets lambda=0 when R is full rank and lambda='estimate'", { set.seed(123) p <- 50 z <- rnorm(p) R <- diag(p) # Full rank - all eigenvalues positive result <- rss_lambda_constructor(z, R, lambda = "estimate") # When R is full rank, length(colspace) == length(z), so lambda should be set to 0 expect_equal(result$data$lambda, 0) }) test_that("rss_lambda_constructor adjusts residual variance with lambda", { z <- rnorm(50) R <- diag(50) result <- rss_lambda_constructor(z, R, lambda = 0.2, residual_variance = 0.8) expect_equal(result$params$residual_variance, 0.6) }) # ============================================================================= # RSS LAMBDA CONSTRUCTOR - Method Restrictions # ============================================================================= test_that("rss_lambda_constructor rejects non-MLE residual variance methods", { z <- rnorm(50) R <- diag(50) expect_error( rss_lambda_constructor(z, R, lambda = 0.5, estimate_residual_method = "MoM"), "RSS-lambda supports estimate_residual_method" ) expect_error( rss_lambda_constructor(z, R, lambda = 0.5, estimate_residual_method = "NIG"), "RSS-lambda supports estimate_residual_method" ) }) test_that("rss_lambda_constructor does not expose unmappable_effects", { z <- rnorm(50) R <- diag(50) expect_error( rss_lambda_constructor(z, R, lambda = 0.5, unmappable_effects = "inf"), "unused argument" ) }) # ============================================================================= # RSS LAMBDA CONSTRUCTOR - MAF Filtering # ============================================================================= test_that("rss_lambda_constructor applies MAF filter", { p <- 50 z 
<- rnorm(p) R <- diag(p) maf <- runif(p, 0, 0.5) result <- rss_lambda_constructor(z, R, lambda = 0.5, maf = maf, maf_thresh = 0.1) n_filtered <- sum(maf > 0.1) expect_equal(result$data$p, n_filtered) expect_length(result$data$z, n_filtered) expect_equal(nrow(result$data$R), n_filtered) }) test_that("rss_lambda_constructor rejects MAF with wrong length", { p <- 50 z <- rnorm(p) R <- diag(p) maf <- runif(p - 10) # Wrong length expect_error( rss_lambda_constructor(z, R, lambda = 0.5, maf = maf), "The length of maf does not agree with expected 50" ) }) # ============================================================================= # RSS LAMBDA CONSTRUCTOR - Null Weight # ============================================================================= test_that("rss_lambda_constructor adds null column when null_weight > 0", { p <- 50 z <- rnorm(p) R <- diag(p) result <- rss_lambda_constructor(z, R, lambda = 0.5, null_weight = 0.1) expect_equal(result$data$p, p + 1) expect_length(result$data$z, p + 1) expect_equal(nrow(result$data$R), p + 1) expect_equal(result$params$null_weight, 0.1) expect_equal(result$data$z[p + 1], 0) }) test_that("rss_lambda_constructor adjusts custom prior weights with null_weight", { p <- 50 z <- rnorm(p) R <- diag(p) # Create custom prior weights (not uniform) custom_weights <- runif(p, 0.5, 2) custom_weights <- custom_weights / sum(custom_weights) # Normalize to sum to 1 result <- rss_lambda_constructor(z, R, lambda = 0.5, prior_weights = custom_weights, null_weight = 0.15) # Check that we have p+1 weights (original p + null column) expect_length(result$params$prior_weights, p + 1) # Check that all weights sum to 1 expect_equal(sum(result$params$prior_weights), 1, tolerance = 1e-10) # Check that the null weight is exactly 0.15 expect_equal(result$params$prior_weights[p + 1], 0.15, tolerance = 1e-10) # Check that the other weights were scaled by (1 - null_weight) = 0.85 expect_equal(result$params$prior_weights[1:p], custom_weights * 0.85, tolerance 
= 1e-10) # Verify that the sum of the first p weights is (1 - 0.15) = 0.85 expect_equal(sum(result$params$prior_weights[1:p]), 0.85, tolerance = 1e-10) }) test_that("rss_lambda_constructor rejects non-numeric null_weight", { p <- 50 z <- rnorm(p) R <- diag(p) expect_error( rss_lambda_constructor(z, R, lambda = 0.5, null_weight = "invalid"), "Null weight must be numeric" ) }) test_that("rss_lambda_constructor rejects negative null_weight", { p <- 50 z <- rnorm(p) R <- diag(p) expect_error( rss_lambda_constructor(z, R, lambda = 0.5, null_weight = -0.1), "Null weight must be between 0 and 1" ) }) test_that("rss_lambda_constructor rejects null_weight >= 1", { p <- 50 z <- rnorm(p) R <- diag(p) expect_error( rss_lambda_constructor(z, R, lambda = 0.5, null_weight = 1.0), "Null weight must be between 0 and 1" ) expect_error( rss_lambda_constructor(z, R, lambda = 0.5, null_weight = 1.5), "Null weight must be between 0 and 1" ) }) # ============================================================================= # SUMMARY STATISTICS CONSTRUCTOR - Routing Logic # ============================================================================= test_that("summary_stats_constructor routes to rss_lambda when lambda != 0", { p <- 50 z <- rnorm(p) R <- diag(p) result <- summary_stats_constructor(z = z, R = R, lambda = 0.5, estimate_residual_method = "MLE") expect_s3_class(result$data, "rss_lambda") expect_equal(result$data$lambda, 0.5) }) test_that("summary_stats_constructor routes to sufficient_stats when lambda = 0", { p <- 50 z <- rnorm(p) R <- diag(p) result <- summary_stats_constructor(z = z, R = R, n = 100, lambda = 0) expect_s3_class(result$data, "ss") }) # ============================================================================= # SUMMARY STATISTICS CONSTRUCTOR - Input Validation # ============================================================================= test_that("summary_stats_constructor rejects R with wrong number of rows", { p <- 50 z <- rnorm(p) # Create R with 
wrong number of rows (40 instead of 50) R_wrong <- diag(40) expect_error( summary_stats_constructor(z = z, R = R_wrong, n = 100, lambda = 0), "The dimension of R \\(40 x 40\\) does not agree with expected \\(50 x 50\\)" ) }) test_that("summary_stats_constructor rejects n <= 1", { p <- 50 z <- rnorm(p) R <- diag(p) # Test n = 1 expect_error( summary_stats_constructor(z = z, R = R, n = 1, lambda = 0), "n must be greater than 1" ) # Test n = 0 expect_error( summary_stats_constructor(z = z, R = R, n = 0, lambda = 0), "n must be greater than 1" ) # Test negative n expect_error( summary_stats_constructor(z = z, R = R, n = -5, lambda = 0), "n must be greater than 1" ) }) test_that("summary_stats_constructor rejects mismatched bhat and shat lengths", { p <- 50 R <- diag(p) bhat <- rnorm(p) shat <- abs(rnorm(p - 5)) # Wrong length expect_error( summary_stats_constructor(bhat = bhat, shat = shat, R = R, n = 100, lambda = 0), "The lengths of bhat and shat do not agree" ) }) test_that("summary_stats_constructor accepts scalar shat and replicates it", { p <- 50 R <- diag(p) bhat <- rnorm(p) shat <- 0.1 # Scalar # Should replicate shat to length of bhat result <- summary_stats_constructor(bhat = bhat, shat = shat, R = R, n = 100, lambda = 0) expect_true(!is.null(result)) }) test_that("summary_stats_constructor rejects missing values in bhat", { p <- 50 R <- diag(p) bhat <- rnorm(p) bhat[5] <- NA shat <- abs(rnorm(p)) expect_error( summary_stats_constructor(bhat = bhat, shat = shat, R = R, n = 100, lambda = 0), "bhat, shat cannot have missing values" ) }) test_that("summary_stats_constructor rejects missing values in shat", { p <- 50 R <- diag(p) bhat <- rnorm(p) shat <- abs(rnorm(p)) shat[10] <- NA expect_error( summary_stats_constructor(bhat = bhat, shat = shat, R = R, n = 100, lambda = 0), "bhat, shat cannot have missing values" ) }) test_that("summary_stats_constructor rejects zero elements in shat", { p <- 50 R <- diag(p) bhat <- rnorm(p) shat <- abs(rnorm(p)) shat[5] <- 0 
expect_error( summary_stats_constructor(bhat = bhat, shat = shat, R = R, n = 100, lambda = 0), "shat cannot have zero or negative elements" ) }) test_that("summary_stats_constructor rejects negative elements in shat", { p <- 50 R <- diag(p) bhat <- rnorm(p) shat <- abs(rnorm(p)) shat[8] <- -0.5 expect_error( summary_stats_constructor(bhat = bhat, shat = shat, R = R, n = 100, lambda = 0), "shat cannot have zero or negative elements" ) }) test_that("summary_stats_constructor rejects empty z vector", { # When z is empty, length(z) = 0, so p = 0 # This causes R dimension check to fail before z length check z <- numeric(0) # Empty vector R <- matrix(0, 0, 0) # Match the expected dimension (0 x 0) expect_error( summary_stats_constructor(z = z, R = R, n = 100, lambda = 0), "Input vector z should have at least one element" ) }) test_that("summary_stats_constructor rejects MAF with wrong length", { p <- 50 z <- rnorm(p) R <- diag(p) maf <- runif(p - 10) # Wrong length expect_error( summary_stats_constructor(z = z, R = R, n = 100, lambda = 0, maf = maf), "The length of maf does not agree with expected 50" ) }) test_that("summary_stats_constructor handles shat and var_y for original scale effects", { p <- 50 bhat <- rnorm(p) shat <- abs(rnorm(p, mean = 0.1, sd = 0.02)) var_y <- 2.5 R <- diag(p) n <- 100 # This should use the original scale path (lines 649-655) result <- summary_stats_constructor( bhat = bhat, shat = shat, var_y = var_y, R = R, n = n, lambda = 0 ) # Verify the result is created successfully expect_true(!is.null(result)) expect_true(!is.null(result$data)) expect_true(!is.null(result$data$XtX)) expect_true(!is.null(result$data$Xty)) expect_true(!is.null(result$data$yty)) # Verify yty matches expected: (n - 1) * var_y expect_equal(result$data$yty, (n - 1) * var_y) }) # ============================================================================= # SUMMARY STATISTICS CONSTRUCTOR - Lambda=0 Path # 
============================================================================= test_that("summary_stats_constructor converts z to sufficient stats", { p <- 50 z <- rnorm(p) R <- diag(p) n <- 100 result <- summary_stats_constructor(z = z, R = R, n = n, lambda = 0) expect_true("XtX" %in% names(result$data)) expect_true("Xty" %in% names(result$data)) expect_true("yty" %in% names(result$data)) }) test_that("summary_stats_constructor handles z without n", { p <- 50 z <- rnorm(p) R <- diag(p) expect_message( result <- summary_stats_constructor(z = z, R = R, lambda = 0), "Providing the sample size" ) expect_s3_class(result$data, "ss") }) test_that("summary_stats_constructor converts bhat/shat to z", { p <- 50 bhat <- rnorm(p) shat <- runif(p, 0.5, 1.5) R <- diag(p) n <- 100 result <- summary_stats_constructor(bhat = bhat, shat = shat, R = R, n = n, lambda = 0) expect_s3_class(result$data, "ss") }) test_that("summary_stats_constructor requires either z or bhat/shat", { R <- diag(50) expect_error( summary_stats_constructor(R = R, n = 100, lambda = 0), "Please provide either z or \\(bhat, shat\\)" ) }) test_that("summary_stats_constructor rejects both z and bhat/shat", { z <- rnorm(50) bhat <- rnorm(50) shat <- runif(50, 0.5, 1.5) R <- diag(50) expect_error( summary_stats_constructor(z = z, bhat = bhat, shat = shat, R = R, n = 100, lambda = 0), "Please provide either z or \\(bhat, shat\\), but not both" ) }) # ============================================================================= # SUMMARY STATISTICS CONSTRUCTOR - Lambda != 0 Restrictions # ============================================================================= test_that("summary_stats_constructor rejects bhat/shat when lambda != 0", { z <- rnorm(50) bhat <- rnorm(50) shat <- runif(50, 0.5, 1.5) R <- diag(50) expect_error( summary_stats_constructor(z = z, R = R, bhat = bhat, shat = shat, lambda = 0.5), "bhat.*shat.*not supported" ) }) test_that("summary_stats_constructor rejects var_y when lambda != 0", { z <- 
rnorm(50) R <- diag(50) expect_error( summary_stats_constructor(z = z, R = R, var_y = 1.5, lambda = 0.5), "var_y.*not supported" ) }) test_that("summary_stats_constructor accepts n when lambda != 0 for PVE adjustment", { z <- rnorm(50) R <- diag(50) # n is used for PVE adjustment in all paths; the lambda > 0 dispatch # routes through rss_lambda_constructor which requires MLE. result <- summary_stats_constructor(z = z, R = R, n = 100, lambda = 0.5, estimate_residual_method = "MLE") expect_true(!is.null(result)) }) # ============================================================================= # SUMMARY STATISTICS CONSTRUCTOR - Lambda=0 Restrictions # ============================================================================= test_that("summary_stats_constructor rejects intercept_value when lambda = 0", { z <- rnorm(50) R <- diag(50) expect_error( summary_stats_constructor(z = z, R = R, n = 100, lambda = 0, intercept_value = 0.5), "intercept_value.*only supported" ) }) # ============================================================================= # INTEGRATION - Constructor Output Usability # ============================================================================= test_that("individual_data_constructor output works with ibss_initialize", { base_data <- generate_base_data(n = 100, p = 50, k = 0, seed = 31) result <- individual_data_constructor(base_data$X, base_data$y, L = 5) expect_error( model <- ibss_initialize(result$data, result$params), NA ) }) test_that("sufficient_stats_constructor output works with ibss_initialize", { base_data <- generate_base_data(n = 100, p = 50, k = 0, seed = 32) XtX <- crossprod(base_data$X) Xty <- crossprod(base_data$X, base_data$y) yty <- sum(base_data$y^2) result <- sufficient_stats_constructor(Xty = Xty, yty = yty, n = base_data$n, XtX = XtX, L = 5) expect_error( model <- ibss_initialize(result$data, result$params), NA ) }) test_that("rss_lambda_constructor output works with ibss_initialize", { z <- rnorm(50) R <- diag(50) 
result <- rss_lambda_constructor(z, R, lambda = 0.5, L = 5) expect_error( model <- ibss_initialize(result$data, result$params), NA ) }) ================================================ FILE: tests/testthat/test_susie_get_functions.R ================================================ context("susie_get_* functions") # ============================================================================= # Get Model Information # ============================================================================= test_that("susie_get_objective returns last ELBO when last_only=TRUE", { set.seed(1) dat <- simulate_regression(n = 100, p = 50, k = 3) fit <- susie(dat$X, dat$y, L = 5, verbose = FALSE) obj <- susie_get_objective(fit, last_only = TRUE) expect_type(obj, "double") expect_length(obj, 1) expect_equal(obj, fit$elbo[length(fit$elbo)]) }) test_that("susie_get_objective returns full ELBO vector when last_only=FALSE", { set.seed(2) dat <- simulate_regression(n = 100, p = 50, k = 3) fit <- susie(dat$X, dat$y, L = 5, verbose = FALSE) obj <- susie_get_objective(fit, last_only = FALSE) expect_type(obj, "double") expect_equal(length(obj), fit$niter) expect_equal(obj, fit$elbo) }) test_that("susie_get_objective detects ELBO decrease", { set.seed(3) dat <- simulate_regression(n = 100, p = 50, k = 3) fit <- susie(dat$X, dat$y, L = 5, verbose = FALSE) fit$elbo <- c(-100, -90, -95, -85) expect_message( susie_get_objective(fit, warning_tol = 1e-6), "Objective is decreasing" ) }) # ============================================================================= # Get Posterior Quantities # ============================================================================= test_that("susie_get_posterior_mean computes correctly", { set.seed(4) dat <- simulate_regression(n = 100, p = 50, k = 3) fit <- susie(dat$X, dat$y, L = 5, verbose = FALSE) pm <- susie_get_posterior_mean(fit) # Should return p-length vector expect_length(pm, dat$p) expect_type(pm, "double") # Manual calculation expected <- 
colSums(fit$alpha * fit$mu) / fit$X_column_scale_factors
  expect_equal(pm, expected)
})

test_that("susie_get_posterior_mean filters effects with V < prior_tol", {
  set.seed(5)
  dat <- simulate_regression(n = 100, p = 50, k = 3)
  fit <- susie(dat$X, dat$y, L = 5, verbose = FALSE)
  # Set some V values to zero
  fit$V[c(1, 3)] <- 0
  pm <- susie_get_posterior_mean(fit, prior_tol = 1e-9)
  # Only effects 2, 4, 5 should contribute
  expected <- colSums((fit$alpha * fit$mu)[c(2, 4, 5), , drop = FALSE]) /
    fit$X_column_scale_factors
  expect_equal(pm, expected)
})

test_that("susie_get_posterior_mean returns zeros when all V=0", {
  set.seed(6)
  dat <- simulate_regression(n = 100, p = 50, k = 3)
  fit <- susie(dat$X, dat$y, L = 5, verbose = FALSE)
  # Set all V to zero
  fit$V <- rep(0, 5)
  pm <- susie_get_posterior_mean(fit)
  expect_length(pm, dat$p)
  expect_equal(pm, rep(0, dat$p))
})

test_that("susie_get_posterior_mean uses all effects when V is not numeric", {
  set.seed(26)
  dat <- simulate_regression(n = 100, p = 50, k = 3)
  fit <- susie(dat$X, dat$y, L = 5, verbose = FALSE)
  # Set V to NULL (not numeric) to trigger the else branch
  fit$V <- NULL
  pm <- susie_get_posterior_mean(fit)
  # Should return p-length vector
  expect_length(pm, dat$p)
  expect_type(pm, "double")
  # Manual calculation using ALL effects (since V is not numeric)
  expected <- colSums(fit$alpha * fit$mu) / fit$X_column_scale_factors
  expect_equal(pm, expected)
})

test_that("susie_get_posterior_sd computes correctly", {
  set.seed(7)
  dat <- simulate_regression(n = 100, p = 50, k = 3)
  fit <- susie(dat$X, dat$y, L = 5, verbose = FALSE)
  psd <- susie_get_posterior_sd(fit)
  # Should return p-length vector
  expect_length(psd, dat$p)
  expect_type(psd, "double")
  expect_true(all(psd >= 0)) # SD must be non-negative
  # Manual calculation: variance is E[b^2] - (E[b])^2 per effect, summed.
  expected <- sqrt(colSums(fit$alpha * fit$mu2 - (fit$alpha * fit$mu)^2)) /
    fit$X_column_scale_factors
  expect_equal(psd, expected)
})

test_that("susie_get_posterior_sd filters effects with V < prior_tol", {
  set.seed(8)
  dat <- simulate_regression(n = 100, p = 50, k = 3)
  fit <- susie(dat$X, dat$y, L = 5, verbose = FALSE)
  # Set some V values to zero
  fit$V[c(2, 4)] <- 0
  psd <- susie_get_posterior_sd(fit, prior_tol = 1e-9)
  # Only effects 1, 3, 5 should contribute
  expected <- sqrt(colSums((fit$alpha * fit$mu2 -
    (fit$alpha * fit$mu)^2)[c(1, 3, 5), , drop = FALSE])) /
    fit$X_column_scale_factors
  expect_equal(psd, expected)
})

test_that("susie_get_posterior_sd uses all effects when V is not numeric", {
  set.seed(27)
  dat <- simulate_regression(n = 100, p = 50, k = 3)
  fit <- susie(dat$X, dat$y, L = 5, verbose = FALSE)
  # Set V to NULL (not numeric) to trigger the else branch
  fit$V <- NULL
  psd <- susie_get_posterior_sd(fit)
  # Should return p-length vector
  expect_length(psd, dat$p)
  expect_type(psd, "double")
  expect_true(all(psd >= 0)) # SD must be non-negative
  # Manual calculation using ALL effects (since V is not numeric)
  expected <- sqrt(colSums(fit$alpha * fit$mu2 - (fit$alpha * fit$mu)^2)) /
    fit$X_column_scale_factors
  expect_equal(psd, expected)
})

test_that("susie_get_posterior_sd returns zeros when no effects pass prior_tol", {
  set.seed(28)
  dat <- simulate_regression(n = 100, p = 50, k = 3)
  fit <- susie(dat$X, dat$y, L = 5, verbose = FALSE)
  # Set all V to zero so no effects pass the prior_tol filter
  fit$V <- rep(0, 5)
  psd <- susie_get_posterior_sd(fit, prior_tol = 1e-9)
  # Should return p-length vector of zeros (length(include_idx) == 0)
  expect_length(psd, dat$p)
  expect_type(psd, "double")
  expect_equal(psd, numeric(dat$p)) # Should be all zeros
  expect_true(all(psd == 0))
})

test_that("susie_get_niter returns correct iteration count", {
  set.seed(9)
  dat <- simulate_regression(n = 100, p = 50, k = 3)
  fit <- susie(dat$X, dat$y, L = 5, max_iter = 50, verbose = FALSE)
  niter <- susie_get_niter(fit)
  expect_type(niter, "integer")
  expect_equal(niter, fit$niter)
  # One ELBO value is recorded per iteration.
  expect_equal(niter, length(fit$elbo))
})

test_that("susie_get_prior_variance returns V", {
  set.seed(10)
  dat <- simulate_regression(n = 100, p = 50,
k = 3)
  fit <- susie(dat$X, dat$y, L = 5, verbose = FALSE)
  V <- susie_get_prior_variance(fit)
  expect_equal(V, fit$V)
  expect_length(V, 5)
  expect_true(all(V >= 0))
})

test_that("susie_get_residual_variance returns sigma2", {
  set.seed(11)
  dat <- simulate_regression(n = 100, p = 50, k = 3)
  fit <- susie(dat$X, dat$y, L = 5, verbose = FALSE)
  sigma2 <- susie_get_residual_variance(fit)
  expect_type(sigma2, "double")
  expect_length(sigma2, 1)
  expect_equal(sigma2, fit$sigma2)
  expect_true(sigma2 > 0)
})

test_that("susie_get_lfsr computes local false sign rate", {
  set.seed(17)
  dat <- simulate_regression(n = 100, p = 50, k = 3)
  fit <- susie(dat$X, dat$y, L = 5, verbose = FALSE)
  lfsr <- susie_get_lfsr(fit)
  # Should return L-length vector (one per effect)
  expect_length(lfsr, 5)
  expect_type(lfsr, "double")
  # LFSR should be in [0, 1]
  expect_true(all(lfsr >= 0 & lfsr <= 1))
})

test_that("susie_get_posterior_samples generates samples", {
  set.seed(18)
  dat <- simulate_regression(n = 100, p = 50, k = 3)
  fit <- susie(dat$X, dat$y, L = 5, verbose = FALSE)
  num_samples <- 100
  samples <- susie_get_posterior_samples(fit, num_samples = num_samples)
  # Should return list with b and gamma
  expect_type(samples, "list")
  expect_named(samples, c("b", "gamma"))
  # Check dimensions
  expect_equal(dim(samples$b), c(dat$p, num_samples))
  expect_equal(dim(samples$gamma), c(dat$p, num_samples))
  # Gamma should be binary
  expect_true(all(samples$gamma %in% c(0, 1)))
  # b should be non-zero only where gamma is 1
  for (i in 1:num_samples) {
    expect_true(all((samples$b[, i] != 0) == (samples$gamma[, i] == 1)))
  }
})

test_that("susie_get_posterior_samples filters effects with V < 1e-9", {
  set.seed(19)
  dat <- simulate_regression(n = 100, p = 50, k = 3)
  fit <- susie(dat$X, dat$y, L = 5, verbose = FALSE)
  # Set all V to zero (no effects)
  fit$V <- rep(0, 5)
  samples <- susie_get_posterior_samples(fit, num_samples = 50)
  # With all V=0, all samples should be zero
  expect_true(all(samples$b == 0))
  expect_true(all(samples$gamma == 0))
})

test_that("susie_get_posterior_samples uses all effects when V is not numeric", {
  set.seed(29)
  dat <- simulate_regression(n = 100, p = 50, k = 3)
  fit <- susie(dat$X, dat$y, L = 5, verbose = FALSE)
  # Set V to NULL (not numeric) to trigger the else branch
  fit$V <- NULL
  num_samples <- 100
  samples <- susie_get_posterior_samples(fit, num_samples = num_samples)
  # Should return list with b and gamma
  expect_type(samples, "list")
  expect_named(samples, c("b", "gamma"))
  # Check dimensions
  expect_equal(dim(samples$b), c(dat$p, num_samples))
  expect_equal(dim(samples$gamma), c(dat$p, num_samples))
  # Gamma should be binary
  expect_true(all(samples$gamma %in% c(0, 1)))
  # When V is not numeric, ALL effects are included (not filtered)
  # So samples should be generated from all L effects
})

# =============================================================================
# Get Credible Sets and Correlations
# =============================================================================

test_that("susie_get_cs identifies credible sets", {
  set.seed(20)
  dat <- simulate_regression(n = 200, p = 100, k = 3, signal_sd = 2)
  fit <- susie(dat$X, dat$y, L = 10, verbose = FALSE)
  cs <- susie_get_cs(fit, coverage = 0.95)
  # Should return list with cs, coverage, requested_coverage
  expect_type(cs, "list")
  expect_true("cs" %in% names(cs))
  expect_true("coverage" %in% names(cs))
  expect_true("requested_coverage" %in% names(cs))
  expect_equal(cs$requested_coverage, 0.95)
  # If CS found, check structure
  if (!is.null(cs$cs)) {
    expect_type(cs$cs, "list")
    expect_true(all(sapply(cs$cs, is.numeric)))
    expect_equal(length(cs$cs), length(cs$coverage))
  }
})

test_that("susie_get_cs filters by purity when X provided", {
  set.seed(21)
  dat <- simulate_regression(n = 200, p = 100, k = 3, signal_sd = 2)
  fit <- susie(dat$X, dat$y, L = 10, verbose = FALSE)
  cs_with_purity <- susie_get_cs(fit, X = dat$X, min_abs_corr = 0.5,
                                 coverage = 0.95)
  # Should have purity and cs_index fields when X provided
  if (!is.null(cs_with_purity$cs))
{
    expect_true("purity" %in% names(cs_with_purity))
    expect_true("cs_index" %in% names(cs_with_purity))
    # Purity should be data frame with min, mean, median
    expect_s3_class(cs_with_purity$purity, "data.frame")
    expect_true(all(c("min.abs.corr", "mean.abs.corr", "median.abs.corr") %in%
      colnames(cs_with_purity$purity)))
    # All purity values should be >= min_abs_corr
    expect_true(all(cs_with_purity$purity$min.abs.corr >= 0.5))
  }
})

test_that("susie_get_cs handles dedup parameter", {
  set.seed(22)
  dat <- simulate_regression(n = 200, p = 100, k = 3, signal_sd = 2)
  fit <- susie(dat$X, dat$y, L = 10, verbose = FALSE)
  cs_dedup <- susie_get_cs(fit, coverage = 0.95, dedup = TRUE)
  cs_no_dedup <- susie_get_cs(fit, coverage = 0.95, dedup = FALSE)
  # With dedup=TRUE, should have <= CS than without
  n_cs_dedup <- if (is.null(cs_dedup$cs)) 0 else length(cs_dedup$cs)
  n_cs_no_dedup <- if (is.null(cs_no_dedup$cs)) 0 else length(cs_no_dedup$cs)
  expect_true(n_cs_dedup <= n_cs_no_dedup)
})

test_that("susie_get_cs errors when both X and Xcorr are provided", {
  set.seed(30)
  dat <- simulate_regression(n = 200, p = 100, k = 3, signal_sd = 2)
  fit <- susie(dat$X, dat$y, L = 10, verbose = FALSE)
  # Create Xcorr
  Xcorr <- cor(dat$X)
  # Should error when both X and Xcorr are specified
  expect_error(
    susie_get_cs(fit, X = dat$X, Xcorr = Xcorr, coverage = 0.95),
    "Only one of X or Xcorr should be specified"
  )
})

test_that("susie_get_cs warns when neither X nor Xcorr is provided", {
  set.seed(40)
  dat <- simulate_regression(n = 200, p = 100, k = 3, signal_sd = 2)
  fit <- susie(dat$X, dat$y, L = 10, verbose = FALSE)
  # Warn even when min_abs_corr is left at its default, since purity
  # filtering is skipped whenever neither X nor Xcorr is supplied.
  expect_message(
    susie_get_cs(fit),
    "purity filtering is skipped"
  )
  # Same warning when min_abs_corr is explicitly set.
  expect_message(
    susie_get_cs(fit, min_abs_corr = 0.9),
    "purity filtering is skipped"
  )
})

test_that("susie_get_cs does not warn when X or Xcorr is provided", {
  set.seed(41)
  dat <- simulate_regression(n = 200, p = 100, k = 3, signal_sd = 2)
  fit <- susie(dat$X, dat$y, L = 10, verbose = FALSE)
  # message= restricts the check to the purity-skip message only;
  # other messages are still allowed.
  expect_no_message(
    susie_get_cs(fit, X = dat$X, min_abs_corr = 0.5),
    message = "purity filtering is skipped"
  )
  expect_no_message(
    susie_get_cs(fit, Xcorr = cor(dat$X), min_abs_corr = 0.5),
    message = "purity filtering is skipped"
  )
})

test_that("susie_get_cs warns and fixes non-symmetric Xcorr", {
  set.seed(31)
  dat <- simulate_regression(n = 200, p = 100, k = 3, signal_sd = 2)
  fit <- susie(dat$X, dat$y, L = 10, verbose = FALSE)
  # Create a non-symmetric correlation matrix
  Xcorr <- cor(dat$X)
  # Make it non-symmetric by modifying upper triangle
  Xcorr[1, 2] <- 0.9
  Xcorr[2, 1] <- 0.8 # Different from Xcorr[1, 2]
  # Should warn about non-symmetry
  expect_message(
    cs <- susie_get_cs(fit, Xcorr = Xcorr, coverage = 0.95,
                       check_symmetric = TRUE),
    "Xcorr is not symmetric; forcing Xcorr to be symmetric"
  )
  # Verify the symmetrization formula: (Xcorr + t(Xcorr)) / 2
  Xcorr_original <- cor(dat$X)
  Xcorr_original[1, 2] <- 0.9
  Xcorr_original[2, 1] <- 0.8
  expected_value <- (0.9 + 0.8) / 2 # Should be 0.85
  expect_equal(expected_value, 0.85)
})

test_that("susie_get_cs uses squared correlation column names when squared=TRUE", {
  set.seed(32)
  dat <- simulate_regression(n = 200, p = 100, k = 3, signal_sd = 2)
  fit <- susie(dat$X, dat$y, L = 10, verbose = FALSE)
  # Get CS with squared=TRUE
  cs_squared <- susie_get_cs(fit, X = dat$X, coverage = 0.95, squared = TRUE)
  # If CS found, check purity column names
  if (!is.null(cs_squared$cs) && !is.null(cs_squared$purity)) {
    expect_true("purity" %in% names(cs_squared))
    expect_s3_class(cs_squared$purity, "data.frame")
    # When squared=TRUE, column names should be min.sq.corr, mean.sq.corr, median.sq.corr
    expect_true(all(c("min.sq.corr", "mean.sq.corr", "median.sq.corr") %in%
      colnames(cs_squared$purity)))
    # Should NOT have the absolute correlation names
    expect_false("min.abs.corr" %in% colnames(cs_squared$purity))
    expect_false("mean.abs.corr" %in% colnames(cs_squared$purity))
    expect_false("median.abs.corr" %in% colnames(cs_squared$purity))
  } else {
    skip("No CS with purity found for squared correlation test")
  }
  # Compare with squared=FALSE (default)
  cs_abs <- susie_get_cs(fit, X = dat$X, coverage = 0.95, squared = FALSE)
  if (!is.null(cs_abs$cs) && !is.null(cs_abs$purity)) {
    # When squared=FALSE, column names should be min.abs.corr, mean.abs.corr, median.abs.corr
    expect_true(all(c("min.abs.corr", "mean.abs.corr", "median.abs.corr") %in%
      colnames(cs_abs$purity)))
    # Should NOT have the squared correlation names
    expect_false("min.sq.corr" %in% colnames(cs_abs$purity))
    expect_false("mean.sq.corr" %in% colnames(cs_abs$purity))
    expect_false("median.sq.corr" %in% colnames(cs_abs$purity))
  }
})

test_that("get_cs_correlation computes correlations between CS", {
  set.seed(23)
  dat <- simulate_regression(n = 200, p = 100, k = 3, signal_sd = 2)
  fit <- susie(dat$X, dat$y, L = 10, verbose = FALSE)
  fit$sets <- susie_get_cs(fit, X = dat$X, coverage = 0.95)
  if (!is.null(fit$sets$cs) && length(fit$sets$cs) > 1) {
    cs_corr <- get_cs_correlation(fit, X = dat$X)
    expect_true(is.matrix(cs_corr))
    expect_equal(nrow(cs_corr), length(fit$sets$cs))
    expect_equal(ncol(cs_corr), length(fit$sets$cs))
    # Each CS is perfectly correlated with itself.
    expect_equal(as.numeric(diag(cs_corr)), rep(1, nrow(cs_corr)))
  } else {
    skip("No multiple CS found for correlation test")
  }
})

test_that("get_cs_correlation with Xcorr instead of X", {
  set.seed(24)
  dat <- simulate_regression(n = 200, p = 100, k = 3, signal_sd = 2)
  fit <- susie(dat$X, dat$y, L = 10, verbose = FALSE)
  fit$sets <- susie_get_cs(fit, X = dat$X, coverage = 0.95)
  if (!is.null(fit$sets$cs) && length(fit$sets$cs) > 1) {
    Xcorr <- cor(dat$X)
    cs_corr <- get_cs_correlation(fit, Xcorr = Xcorr)
    expect_true(is.matrix(cs_corr))
    expect_equal(nrow(cs_corr),
length(fit$sets$cs))
  } else {
    skip("No multiple CS found for Xcorr test")
  }
})

test_that("get_cs_correlation returns NA when no CS or only one CS", {
  set.seed(33)
  dat <- simulate_regression(n = 100, p = 50, k = 1)
  fit <- susie(dat$X, dat$y, L = 5, verbose = FALSE)
  # A pairwise correlation needs at least two credible sets.
  # Case 1: No CS at all
  fit$sets <- list(cs = NULL)
  result <- get_cs_correlation(fit, X = dat$X)
  expect_true(is.na(result))
  # Case 2: Only one CS
  fit$sets <- list(cs = list(c(1, 2, 3)))
  result <- get_cs_correlation(fit, X = dat$X)
  expect_true(is.na(result))
})

test_that("get_cs_correlation errors when both X and Xcorr are provided", {
  set.seed(34)
  dat <- simulate_regression(n = 200, p = 100, k = 3, signal_sd = 2)
  fit <- susie(dat$X, dat$y, L = 10, verbose = FALSE)
  fit$sets <- susie_get_cs(fit, X = dat$X, coverage = 0.95)
  if (!is.null(fit$sets$cs) && length(fit$sets$cs) > 1) {
    Xcorr <- cor(dat$X)
    # Should error when both X and Xcorr are specified
    expect_error(
      get_cs_correlation(fit, X = dat$X, Xcorr = Xcorr),
      "Only one of X or Xcorr should be specified"
    )
  } else {
    skip("No multiple CS found for test")
  }
})

test_that("get_cs_correlation errors when neither X nor Xcorr are provided", {
  set.seed(35)
  dat <- simulate_regression(n = 200, p = 100, k = 3, signal_sd = 2)
  fit <- susie(dat$X, dat$y, L = 10, verbose = FALSE)
  fit$sets <- susie_get_cs(fit, X = dat$X, coverage = 0.95)
  if (!is.null(fit$sets$cs) && length(fit$sets$cs) > 1) {
    # Should error when neither X nor Xcorr are specified
    expect_error(
      get_cs_correlation(fit, X = NULL, Xcorr = NULL),
      "One of X or Xcorr must be specified"
    )
  } else {
    skip("No multiple CS found for test")
  }
})

test_that("get_cs_correlation warns and fixes non-symmetric Xcorr", {
  set.seed(36)
  dat <- simulate_regression(n = 200, p = 100, k = 3, signal_sd = 2)
  fit <- susie(dat$X, dat$y, L = 10, verbose = FALSE)
  fit$sets <- susie_get_cs(fit, X = dat$X, coverage = 0.95)
  if (!is.null(fit$sets$cs) && length(fit$sets$cs) > 1) {
    # Create a non-symmetric correlation matrix
    Xcorr <- cor(dat$X)
    Xcorr[1, 2] <- 0.9
    Xcorr[2, 1] <- 0.8 # Different from Xcorr[1, 2]
    # Should warn about non-symmetry
    expect_message(
      cs_corr <- get_cs_correlation(fit, Xcorr = Xcorr),
      "Xcorr is not symmetric; forcing Xcorr to be symmetric"
    )
    # Verify the symmetrization formula: (Xcorr + t(Xcorr)) / 2
    expected_value <- (0.9 + 0.8) / 2 # Should be 0.85
    expect_equal(expected_value, 0.85)
  } else {
    skip("No multiple CS found for test")
  }
})

test_that("get_cs_correlation with max=TRUE returns scalar maximum", {
  set.seed(37)
  dat <- simulate_regression(n = 200, p = 100, k = 3, signal_sd = 2)
  fit <- susie(dat$X, dat$y, L = 10, verbose = FALSE)
  fit$sets <- susie_get_cs(fit, X = dat$X, coverage = 0.95)
  if (!is.null(fit$sets$cs) && length(fit$sets$cs) > 1) {
    # Get full correlation matrix first
    cs_corr_matrix <- get_cs_correlation(fit, X = dat$X, max = FALSE)
    # Get max correlation
    cs_corr_max <- get_cs_correlation(fit, X = dat$X, max = TRUE)
    # Should be a scalar
    expect_type(cs_corr_max, "double")
    expect_length(cs_corr_max, 1)
    # Should equal max of upper triangle absolute values
    expected_max <- max(abs(cs_corr_matrix[upper.tri(cs_corr_matrix)]))
    expect_equal(cs_corr_max, expected_max)
    # Max should be >= 0 and <= 1 (correlation)
    expect_true(cs_corr_max >= 0 && cs_corr_max <= 1)
    # When max=TRUE, should not have rownames/colnames (it's a scalar)
    expect_null(names(cs_corr_max))
  } else {
    skip("No multiple CS found for test")
  }
})

# =============================================================================
# Get PIPs and Related Functions
# =============================================================================

test_that("susie_get_pip computes PIPs correctly", {
  set.seed(12)
  dat <- simulate_regression(n = 100, p = 50, k = 3)
  fit <- susie(dat$X, dat$y, L = 5, verbose = FALSE)
  pip <- susie_get_pip(fit)
  # Should return p-length vector
  expect_length(pip, dat$p)
  expect_type(pip, "double")
  # All PIPs should be in [0, 1]
  expect_true(all(pip >= 0 & pip <= 1))
  # Manual calculation: 1 - prod(1 - alpha)
  expected <- 1 - apply(1 - fit$alpha, 2, prod)
  expect_equal(pip, expected)
})

test_that("susie_get_pip handles null_index correctly", {
  set.seed(13)
  dat <- simulate_regression(n = 100, p = 50, k = 3)
  fit <- susie(dat$X, dat$y, L = 5, null_weight = 0.1, verbose = FALSE)
  pip <- susie_get_pip(fit)
  expect_length(pip, dat$p)
  expect_true(all(pip >= 0 & pip <= 1))
  # With a null weight, alpha gains one extra (null) column.
  if (!is.null(fit$null_index) && fit$null_index > 0) {
    expect_true(ncol(fit$alpha) == dat$p + 1)
  }
})

test_that("susie_get_pip filters by prior_tol", {
  set.seed(14)
  dat <- simulate_regression(n = 100, p = 50, k = 3)
  fit <- susie(dat$X, dat$y, L = 5, verbose = FALSE)
  # Set some V to zero
  fit$V[c(1, 5)] <- 0
  pip <- susie_get_pip(fit, prior_tol = 1e-9)
  # Only effects 2, 3, 4 should contribute
  expected <- 1 - apply(1 - fit$alpha[c(2, 3, 4), , drop = FALSE], 2, prod)
  expect_equal(pip, expected)
})

test_that("susie_get_pip with prune_by_cs filters to CS effects only", {
  set.seed(15)
  dat <- simulate_regression(n = 100, p = 50, k = 3)
  fit <- susie(dat$X, dat$y, L = 10, verbose = FALSE)
  # Get CS
  fit$sets <- susie_get_cs(fit, coverage = 0.95)
  pip_pruned <- susie_get_pip(fit, prune_by_cs = TRUE)
  # Should still return p-length vector
  expect_length(pip_pruned, dat$p)
  expect_true(all(pip_pruned >= 0 & pip_pruned <= 1))
  # If there are CS, pruned PIPs should be different from unpruned
  if (!is.null(fit$sets$cs_index)) {
    pip_full <- susie_get_pip(fit, prune_by_cs = FALSE)
    # At least some should differ (unless all effects are in CS)
    expect_true(any(pip_pruned != pip_full) ||
      length(fit$sets$cs_index) == nrow(fit$alpha))
  }
})

test_that("susie_get_pip returns zeros when no CS and prune_by_cs=TRUE", {
  set.seed(16)
  dat <- simulate_regression(n = 100, p = 50, k = 3)
  fit <- susie(dat$X, dat$y, L = 5, verbose = FALSE)
  # Force no credible sets
  fit$sets <- list(cs = NULL, cs_index = NULL)
  pip <- susie_get_pip(fit, prune_by_cs = TRUE)
  expect_length(pip, dat$p)
  # When no CS, all PIPs should be zero
  expect_true(all(pip == 0))
})
test_that("susie_get_pip uses all effects when V is not numeric", {
  set.seed(38)
  dat <- simulate_regression(n = 100, p = 50, k = 3)
  fit <- susie(dat$X, dat$y, L = 5, verbose = FALSE)
  # Set V to NULL (not numeric) to trigger the else branch
  fit$V <- NULL
  pip <- susie_get_pip(fit)
  # Should return p-length vector
  expect_length(pip, dat$p)
  expect_type(pip, "double")
  # All PIPs should be in [0, 1]
  expect_true(all(pip >= 0 & pip <= 1))
  # Manual calculation using ALL effects (since V is not numeric)
  expected <- 1 - apply(1 - fit$alpha, 2, prod)
  expect_equal(pip, expected)
})

test_that("susie_get_pip with prune_by_cs uses intersection of include_idx and cs_index", {
  set.seed(39)
  dat <- simulate_regression(n = 100, p = 50, k = 3)
  fit <- susie(dat$X, dat$y, L = 10, verbose = FALSE)
  # Get CS
  fit$sets <- susie_get_cs(fit, coverage = 0.95)
  # Also set some V to zero to create a filtering scenario
  fit$V[c(1, 2)] <- 0
  if (!is.null(fit$sets$cs_index)) {
    # Get PIPs with prune_by_cs=TRUE
    pip_pruned <- susie_get_pip(fit, prune_by_cs = TRUE, prior_tol = 1e-9)
    # Should return p-length vector
    expect_length(pip_pruned, dat$p)
    expect_true(all(pip_pruned >= 0 & pip_pruned <= 1))
    # Manually compute what include_idx should be
    # Effects with V > prior_tol
    include_idx_V <- which(fit$V > 1e-9) # Should exclude 1, 2
    # Intersection with cs_index (only effects in CS)
    include_idx_final <- intersect(include_idx_V, fit$sets$cs_index)
    # If the intersection is non-empty, compute expected PIPs
    if (length(include_idx_final) > 0) {
      expected <- 1 - apply(1 - fit$alpha[include_idx_final, , drop = FALSE],
                            2, prod)
      expect_equal(pip_pruned, expected)
    } else {
      # If intersection is empty, should be all zeros
      expect_true(all(pip_pruned == 0))
    }
  } else {
    skip("No CS found for intersection test")
  }
})

# =============================================================================
# Initialization Functions
# =============================================================================

test_that("susie_init_coef creates valid initialization object", {
  p <- 100
  coef_index <- c(5, 20, 45, 80)
  coef_value <- c(1.5, -2.0, 0.8, -1.2)
  init <- susie_init_coef(coef_index, coef_value, p)
  # Should return susie object
  expect_s3_class(init, "susie")
  expect_type(init, "list")
  # Should have required fields
  expect_true(all(c("alpha", "mu", "mu2") %in% names(init)))
  expect_null(init$V)
  # Check dimensions; L is implied by the number of initialized effects.
  L <- length(coef_index)
  expect_equal(dim(init$alpha), c(L, p))
  expect_equal(dim(init$mu), c(L, p))
  expect_equal(dim(init$mu2), c(L, p))
})

test_that("susie_init_coef sets alpha correctly", {
  p <- 50
  coef_index <- c(10, 25, 40)
  coef_value <- c(1.0, 2.0, 3.0)
  init <- susie_init_coef(coef_index, coef_value, p)
  # Alpha should be indicator matrix
  for (i in seq_along(coef_index)) {
    expect_equal(init$alpha[i, coef_index[i]], 1)
    expect_equal(sum(init$alpha[i, ]), 1) # Each row sums to 1
    expect_equal(sum(init$alpha[i, -coef_index[i]]), 0) # All others are 0
  }
})

test_that("susie_init_coef sets mu and mu2 correctly", {
  p <- 50
  coef_index <- c(10, 25, 40)
  coef_value <- c(1.5, -2.0, 0.8)
  init <- susie_init_coef(coef_index, coef_value, p)
  # Mu should have coef_value at coef_index
  for (i in seq_along(coef_index)) {
    expect_equal(init$mu[i, coef_index[i]], coef_value[i])
    expect_equal(sum(init$mu[i, -coef_index[i]]), 0) # All others are 0
  }
  # mu2 should equal mu^2
  expect_equal(init$mu2, init$mu * init$mu)
})

test_that("susie_init_coef errors on invalid inputs", {
  # No effects
  expect_error(
    susie_init_coef(integer(0), numeric(0), 100),
    "Need at least one non-zero effect"
  )
  # Zero coefficient value
  expect_error(
    susie_init_coef(c(1, 5), c(1.0, 0.0), 100),
    "Input coef_value must be non-zero for all its elements"
  )
  # Mismatched lengths
  expect_error(
    susie_init_coef(c(1, 5, 10), c(1.0, 2.0), 100),
    "Inputs coef_index and coef_value must of the same length"
  )
  # Index out of bounds
  expect_error(
    susie_init_coef(c(1, 5, 150), c(1.0, 2.0, 3.0), 100),
    "Input coef_index exceeds the boundary of p"
  )
})
test_that("susie_init_coef works with susie", {
  set.seed(25)
  n <- 100
  p <- 50
  # Create data with known true effects
  dat <- simulate_regression(n = n, p = p, k = 3)
  true_coef_idx <- which(dat$beta != 0)
  true_coef_val <- dat$beta[true_coef_idx]
  # Initialize with true coefficients
  init <- susie_init_coef(true_coef_idx, true_coef_val, p)
  # Fit susie with initialization
  fit <- susie(dat$X, dat$y, L = 10, model_init = init, verbose = FALSE)
  # Should return valid susie fit
  expect_s3_class(fit, "susie")
  expect_true(!is.null(fit$alpha))
  expect_true(!is.null(fit$mu))
  expect_true(!is.null(fit$elbo))
})

================================================
FILE: tests/testthat/test_susie_small.R
================================================

context("test_susie_small.R")

test_that(paste("check that ELBO is monotonically increasing for ",
                "estimate_residual_method = 'NIG', ",
                "with L = 1"),{
  set.seed(1)
  data(data_small)
  y <- data_small$y
  X <- data_small$X
  fit <- susie(X,y,L = 1,estimate_residual_method = "NIG",
               alpha0 = 0.1,beta0 = 0.1,tol = 1e-6,verbose = TRUE)
  # Every successive ELBO must be no smaller than the previous one.
  expect_true(all(diff(fit$elbo) >= 0))
})

================================================
FILE: tests/testthat/test_susie_utils.R
================================================

context("Utility functions for susieR")

# =============================================================================
# FUNDAMENTAL BUILDING BLOCKS
# =============================================================================

test_that("warning_message displays warnings correctly", {
  # Test warning style (default)
  expect_message(
    warning_message("Test warning"),
    "WARNING:.*Test warning"
  )
  # Test warning style (explicit)
  expect_message(
    warning_message("Test warning", style = "warning"),
    "WARNING:.*Test warning"
  )
  # Test hint style
  expect_message(
    warning_message("Test hint", style = "hint"),
    "HINT:.*Test hint"
  )
  # Test with warn < 0; restore the user's option on exit.
  old_warn <- getOption("warn")
  on.exit(options(warn = old_warn), add = TRUE)
  options(warn = -1)
  expect_no_error(warning_message("Still executes", style = "warning"))
  # Hint should still show even with warn < 0
  expect_message(
    warning_message("Hint shows", style = "hint"),
    "HINT:.*Hint shows"
  )
})

test_that("safe_cor computes correlation and handles zero sd columns", {
  # Normal correlation
  x <- matrix(c(1, 2, 3, 4, 5, 6), nrow = 3, ncol = 2)
  result <- safe_cor(x)
  expected <- cor(x)
  expect_equal(result, expected)
  # With constant column (zero sd) - should handle without warning
  x_const <- cbind(x, rep(1, 3))
  # Without safe_cor, cor() would warn
  expect_warning(cor(x_const), "the standard deviation is zero")
  # safe_cor handles this without warning and returns 0 for constant column correlations
  expect_silent(result <- safe_cor(x_const))
  # Check that correlations involving constant column are 0 (not NA)
  expect_equal(result[3, 1], 0)
  expect_equal(result[3, 2], 0)
  expect_equal(result[1, 3], 0)
  expect_equal(result[2, 3], 0)
  # Diagonal should still be 1
  expect_equal(diag(result), c(1, 1, 1))
})

test_that("safe_cov2cor computes correlation from covariance and handles zero variance", {
  # Normal case
  cov_mat <- matrix(c(4, 2, 2, 3), nrow = 2)
  result <- safe_cov2cor(cov_mat)
  expected <- cov2cor(cov_mat)
  expect_equal(result, expected)
  # With zero variance entry - safe_cov2cor handles this without warning
  cov_mat_zero <- matrix(c(0, 0, 0, 3), nrow = 2)
  # Without safe_cov2cor, cov2cor() would warn
  expect_warning(cov2cor(cov_mat_zero))
  # safe_cov2cor handles zero variance by returning 0 correlations (not NA)
  expect_silent(result <- safe_cov2cor(cov_mat_zero))
  expect_true(is.matrix(result))
  # Diagonal should be 1
  expect_equal(diag(result), c(1, 1))
  # Off-diagonal correlations involving zero-variance variable should be 0
  expect_equal(result[1, 2], 0)
  expect_equal(result[2, 1], 0)
})

test_that("safe_cor handles constant columns without warnings", {
  # Create data with a constant column that would trigger a warning in base cor()
  x_const <- matrix(c(1, 2, 3, 4, 5, 6, 1, 1, 1), nrow =
3, ncol = 3)
  # Verify that base cor() would warn
  expect_warning(cor(x_const), "the standard deviation is zero")
  # Test that safe_cor handles it silently
  expect_silent(safe_cor(x_const))
  # Verify result is computed correctly
  result <- safe_cor(x_const)
  expect_true(is.matrix(result))
  # Correlations involving the constant column (col 3) should be 0, not NA
  expect_equal(result[3, 1], 0)
  expect_equal(result[3, 2], 0)
  expect_equal(result[1, 3], 0)
  expect_equal(result[2, 3], 0)
  # Diagonal should be 1
  expect_equal(diag(result), c(1, 1, 1))
})

test_that("safe_cov2cor handles zero variance without warnings", {
  # Create covariance matrix with zero variance that would trigger a warning in base cov2cor()
  cov_mat_zero <- matrix(c(0, 0, 0, 3), nrow = 2)
  # Verify that base cov2cor() would warn
  expect_warning(cov2cor(cov_mat_zero))
  # Test that safe_cov2cor handles it silently
  expect_silent(safe_cov2cor(cov_mat_zero))
  # Verify result is computed correctly
  result <- safe_cov2cor(cov_mat_zero)
  expect_true(is.matrix(result))
  # Correlations involving zero-variance variable should be 0, not NA
  expect_equal(result[1, 2], 0)
  expect_equal(result[2, 1], 0)
  # Diagonal should be 1
  expect_equal(diag(result), c(1, 1))
})

test_that("is_symmetric_matrix correctly identifies symmetric matrices", {
  # Symmetric matrix
  sym_mat <- matrix(c(1, 2, 3, 2, 4, 5, 3, 5, 6), nrow = 3)
  expect_true(is_symmetric_matrix(sym_mat))
  # Non-symmetric matrix
  nonsym_mat <- matrix(c(1, 2, 3, 4, 5, 6, 7, 8, 9), nrow = 3)
  expect_false(is_symmetric_matrix(nonsym_mat))
  # Identity matrix
  expect_true(is_symmetric_matrix(diag(5)))
  # Sparse symmetric matrix
  sparse_sym <- Matrix::Matrix(sym_mat, sparse = TRUE)
  expect_true(is_symmetric_matrix(sparse_sym))
})

test_that("apply_nonzeros applies function to nonzero elements of sparse matrix", {
  # Create sparse matrix
  X <- Matrix::Matrix(c(1, 0, 0, 2, 0, 3, 4, 0, 5), nrow = 3, sparse = TRUE)
  # Square all nonzero elements
  result <- apply_nonzeros(X, function(x) x^2)
  # Check dimensions preserved
  expect_equal(dim(result), dim(X))
  # Check that zeros remain zeros
  expect_equal(sum(result == 0), sum(X == 0))
  # Check nonzero values are squared
  expected <- Matrix::Matrix(c(1, 0, 0, 4, 0, 9, 16, 0, 25), nrow = 3,
                             sparse = TRUE)
  expect_equal(as.matrix(result), as.matrix(expected))
  # Test with another function (doubling)
  result2 <- apply_nonzeros(X, function(x) x * 2)
  expected2 <- Matrix::Matrix(c(2, 0, 0, 4, 0, 6, 8, 0, 10), nrow = 3,
                              sparse = TRUE)
  expect_equal(as.matrix(result2), as.matrix(expected2))
})

test_that("compute_colSds computes column standard deviations correctly", {
  # Dense matrix; matrixStats::colSds is the dense reference implementation.
  X_dense <- matrix(rnorm(100), nrow = 10, ncol = 10)
  result_dense <- compute_colSds(X_dense)
  expected_dense <- matrixStats::colSds(X_dense)
  expect_equal(result_dense, expected_dense, tolerance = 1e-10)
  # Sparse matrix
  X_sparse <- Matrix::Matrix(X_dense, sparse = TRUE)
  X_sparse[abs(X_sparse) < 0.5] <- 0 # Make it actually sparse
  result_sparse <- compute_colSds(X_sparse)
  expected_sparse <- apply(as.matrix(X_sparse), 2, sd)
  expect_equal(result_sparse, expected_sparse, tolerance = 1e-10)
  # Matrix with constant column (sd = 0)
  X_const <- cbind(X_dense, rep(1, 10))
  result_const <- compute_colSds(X_const)
  expect_equal(result_const[11], 0)
  expect_equal(result_const[1:10], matrixStats::colSds(X_dense))
})

test_that("compute_colstats computes column statistics correctly", {
  base_data <- generate_base_data(n = 100, p = 50, seed = 123)
  # Test with both center and scale
  result <- compute_colstats(base_data$X, center = TRUE, scale = TRUE)
  # Check components exist
  expect_true(all(c("cm", "csd", "d") %in% names(result)))
  expect_length(result$cm, base_data$p)
  expect_length(result$csd, base_data$p)
  expect_length(result$d, base_data$p)
  # Check column means
  expect_equal(result$cm, colMeans(base_data$X), tolerance = 1e-10)
  # Check column sds
  expected_csd <- apply(base_data$X, 2, sd)
  expect_equal(result$csd, expected_csd, tolerance = 1e-10)
  # Check d values (sum of squared standardized values)
  X_std <- scale(base_data$X, center = TRUE, scale = TRUE)
  expected_d <- colSums(X_std^2)
  expect_equal(result$d, expected_d, tolerance = 1e-8)
  # Test with center = FALSE
  result_nocenter <- compute_colstats(base_data$X, center = FALSE, scale = TRUE)
  expect_equal(result_nocenter$cm, rep(0, base_data$p))
  expect_equal(result_nocenter$csd, expected_csd, tolerance = 1e-10)
  # Test with scale = FALSE
  result_noscale <- compute_colstats(base_data$X, center = TRUE, scale = FALSE)
  expect_equal(result_noscale$cm, colMeans(base_data$X), tolerance = 1e-10)
  expect_equal(result_noscale$csd, rep(1, base_data$p))
  # Test with neither center nor scale
  result_neither <- compute_colstats(base_data$X, center = FALSE, scale = FALSE)
  expect_equal(result_neither$cm, rep(0, base_data$p))
  expect_equal(result_neither$csd, rep(1, base_data$p))
  expected_d_neither <- colSums(base_data$X^2)
  expect_equal(result_neither$d, expected_d_neither, tolerance = 1e-10)
  # Test with column of zeros (sd = 0)
  X_zero <- cbind(base_data$X, rep(0, base_data$n))
  result_zero <- compute_colstats(X_zero, center = TRUE, scale = TRUE)
  expect_equal(result_zero$csd[base_data$p + 1], 1) # sd = 0 replaced by 1
  # Test with sparse matrix
  X_sparse <- Matrix::Matrix(base_data$X, sparse = TRUE)
  X_sparse[abs(X_sparse) < 1] <- 0
  result_sparse <- compute_colstats(X_sparse, center = TRUE, scale = TRUE)
  expect_length(result_sparse$cm, base_data$p)
  expect_length(result_sparse$csd, base_data$p)
  expect_length(result_sparse$d, base_data$p)
})

# =============================================================================
# DATA PROCESSING & VALIDATION
# =============================================================================

test_that("check_semi_pd identifies positive semi-definite matrices", {
  # Positive definite matrix
  A_pd <- matrix(c(2, 1, 1, 2), nrow = 2)
  result_pd <- check_semi_pd(A_pd, tol = 1e-10)
  expect_true(result_pd$status)
  expect_true(all(result_pd$eigenvalues >= 0))
  expect_true(!is.null(attr(result_pd$matrix,
"eigen"))) # Positive semi-definite matrix (singular) A_psd <- matrix(c(1, 1, 1, 1), nrow = 2) result_psd <- check_semi_pd(A_psd, tol = 1e-10) expect_true(result_psd$status) expect_true(min(result_psd$eigenvalues) >= 0) expect_true(any(abs(result_psd$eigenvalues) < 1e-10)) # Has zero eigenvalue # Not positive semi-definite A_neg <- matrix(c(1, 2, 2, -1), nrow = 2) result_neg <- check_semi_pd(A_neg, tol = 1e-10) expect_false(result_neg$status) expect_true(any(result_neg$eigenvalues < 0)) # Identity matrix A_id <- diag(3) result_id <- check_semi_pd(A_id, tol = 1e-10) expect_true(result_id$status) expect_equal(result_id$eigenvalues, rep(1, 3), tolerance = 1e-10) }) test_that("check_projection verifies if vector is in eigenspace", { # Create a matrix and vector in its column space A <- matrix(c(4, 2, 2, 3), nrow = 2) b_in <- c(2, 1) # In column space result_in <- check_projection(A, b_in) expect_true(result_in$status) expect_true(is.na(result_in$msg)) # Test with pre-computed eigen decomposition A_with_eigen <- A attr(A_with_eigen, "eigen") <- eigen(A, symmetric = TRUE) result_with_eigen <- check_projection(A_with_eigen, b_in) expect_true(result_with_eigen$status) }) test_that("validate_init validates model initialization objects", { # Create valid model_init p <- 50 L <- 5 valid_init <- list( alpha = matrix(1/p, L, p), mu = matrix(0, L, p), mu2 = matrix(0, L, p), V = rep(1, L), sigma2 = 1, pi = rep(1/p, p), null_index = 0 ) class(valid_init) <- "susie" data <- list(n = 100, p = p) params <- list(L = L, model_init = valid_init) # Should pass without error expect_silent(validate_init(data, params)) # Test: not a susie object bad_init <- valid_init class(bad_init) <- "lm" params_bad <- list(L = L, model_init = bad_init) expect_error(validate_init(data, params_bad), "model_init must be a 'susie' object") # Test: NA in alpha bad_init <- valid_init bad_init$alpha[1, 1] <- NA params_bad <- list(L = L, model_init = bad_init) expect_error(validate_init(data, params_bad), 
"model_init\\$alpha contains NA/Inf") # Test: Inf in mu bad_init <- valid_init bad_init$mu[1, 1] <- Inf params_bad <- list(L = L, model_init = bad_init) expect_error(validate_init(data, params_bad), "model_init\\$mu contains NA/Inf") # Test: alpha not a matrix bad_init <- valid_init bad_init$alpha <- as.vector(bad_init$alpha) params_bad <- list(L = L, model_init = bad_init) expect_error(validate_init(data, params_bad), "model_init\\$alpha must be a matrix") # Test: alpha values outside [0,1] bad_init <- valid_init bad_init$alpha[1, 1] <- 1.5 params_bad <- list(L = L, model_init = bad_init) expect_error(validate_init(data, params_bad), "invalid values outside range") # Test: dimension mismatch bad_init <- valid_init bad_init$mu <- matrix(0, L, p - 1) params_bad <- list(L = L, model_init = bad_init) expect_error(validate_init(data, params_bad), "dimensions do not match") # Test: V length mismatch bad_init <- valid_init bad_init$V <- rep(1, L - 1) params_bad <- list(L = L, model_init = bad_init) expect_error(validate_init(data, params_bad), "does not equal nrow") # Test: negative V bad_init <- valid_init bad_init$V[1] <- -1 params_bad <- list(L = L, model_init = bad_init) expect_error(validate_init(data, params_bad), "at least one negative value") # Test: negative sigma2 bad_init <- valid_init bad_init$sigma2 <- -0.5 params_bad <- list(L = L, model_init = bad_init) expect_error(validate_init(data, params_bad), "sigma2 is negative") # Test: NULL V (should pass) init_no_V <- valid_init init_no_V$V <- NULL params_no_V <- list(L = L, model_init = init_no_V) expect_silent(validate_init(data, params_no_V)) # Test 1: mu2 contains NA/Inf values bad_init <- valid_init bad_init$mu2[2, 3] <- NA params_bad <- list(L = L, model_init = bad_init) expect_error(validate_init(data, params_bad), "model_init\\$mu2 contains NA/Inf values") bad_init <- valid_init bad_init$mu2[1, 5] <- Inf params_bad <- list(L = L, model_init = bad_init) expect_error(validate_init(data, params_bad), 
"model_init\\$mu2 contains NA/Inf values") # Test 2: V contains NA/Inf values bad_init <- valid_init bad_init$V[2] <- NA params_bad <- list(L = L, model_init = bad_init) expect_error(validate_init(data, params_bad), "model_init\\$V contains NA/Inf values") bad_init <- valid_init bad_init$V[3] <- Inf params_bad <- list(L = L, model_init = bad_init) expect_error(validate_init(data, params_bad), "model_init\\$V contains NA/Inf values") # Test 3: sigma2 contains NA/Inf bad_init <- valid_init bad_init$sigma2 <- NA params_bad <- list(L = L, model_init = bad_init) expect_error(validate_init(data, params_bad), "model_init\\$sigma2 contains NA/Inf") bad_init <- valid_init bad_init$sigma2 <- Inf params_bad <- list(L = L, model_init = bad_init) expect_error(validate_init(data, params_bad), "model_init\\$sigma2 contains NA/Inf") # Test 4: pi contains NA/Inf bad_init <- valid_init bad_init$pi[10] <- NA params_bad <- list(L = L, model_init = bad_init) expect_error(validate_init(data, params_bad), "model_init\\$pi contains NA/Inf") bad_init <- valid_init bad_init$pi[5] <- Inf params_bad <- list(L = L, model_init = bad_init) expect_error(validate_init(data, params_bad), "model_init\\$pi contains NA/Inf") # Test 5: mu2 and alpha dimensions do not match bad_init <- valid_init bad_init$mu2 <- matrix(0, L, p - 1) params_bad <- list(L = L, model_init = bad_init) expect_error(validate_init(data, params_bad), "model_init\\$mu2 and model_init\\$alpha dimensions do not match") bad_init <- valid_init bad_init$mu2 <- matrix(0, L + 1, p) params_bad <- list(L = L, model_init = bad_init) expect_error(validate_init(data, params_bad), "model_init\\$mu2 and model_init\\$alpha dimensions do not match") # Test 6: V must be numeric # Note: This branch is unreachable because is.finite() on character vectors # returns FALSE, triggering the NA/Inf error first. The numeric check only runs # if all values pass is.finite(). Testing with numeric values only. 
bad_init <- valid_init bad_init$V <- rep(0, L) # All zeros (valid finite numerics) # This should pass all checks since 0 is valid for V params_ok <- list(L = L, model_init = bad_init) expect_silent(validate_init(data, params_ok)) # Test 7: sigma2 must be numeric # Note: Similar to above - unreachable branch due to is.finite() check first bad_init <- valid_init bad_init$sigma2 <- 0 # Zero is valid params_ok <- list(L = L, model_init = bad_init) expect_silent(validate_init(data, params_ok)) # Test 8: pi length must match number of columns in alpha bad_init <- valid_init bad_init$pi <- rep(1/(p-1), p - 1) params_bad <- list(L = L, model_init = bad_init) expect_error(validate_init(data, params_bad), "model_init\\$pi should have the same length as the number of columns in model_init\\$alpha") bad_init <- valid_init bad_init$pi <- rep(1/(p+1), p + 1) params_bad <- list(L = L, model_init = bad_init) expect_error(validate_init(data, params_bad), "model_init\\$pi should have the same length as the number of columns in model_init\\$alpha") }) test_that("convert_individual_to_ss converts individual data to sufficient statistics", { setup <- setup_individual_data(n = 100, p = 50, L = 5, seed = 123) data <- setup$data params <- list( unmappable_effects = "inf", verbose = FALSE ) # Convert ss_data <- convert_individual_to_ss(data, params) # Check class expect_s3_class(ss_data, "ss") # Check components exist expect_true(all(c("XtX", "Xty", "yty", "n", "p") %in% names(ss_data))) # Check dimensions expect_equal(dim(ss_data$XtX), c(50, 50)) expect_length(ss_data$Xty, 50) expect_length(ss_data$yty, 1) # Values may be rescaled for unmappable effects expect_true(is.numeric(ss_data$XtX)) expect_true(is.numeric(ss_data$Xty)) expect_true(is.numeric(ss_data$yty)) expect_true(ss_data$yty > 0) # Check attributes preserved expect_equal(ss_data$X_colmeans, attr(data$X, "scaled:center")) expect_equal(ss_data$y_mean, data$mean_y) expect_equal(attr(ss_data$XtX, "d"), attr(data$X, "d")) 
expect_equal(attr(ss_data$XtX, "scaled:scale"), attr(data$X, "scaled:scale")) # Check eigen decomposition added for unmappable effects expect_true(!is.null(ss_data$eigen_vectors)) expect_true(!is.null(ss_data$eigen_values)) expect_true(!is.null(ss_data$VtXty)) }) test_that("extract_prior_weights extracts and rescales prior weights", { p <- 100 # Test: no null weight model_no_null <- list( pi = rep(1/p, p), null_weight = 0, null_index = 0 ) result <- extract_prior_weights(model_no_null) expect_equal(result, rep(1/p, p)) # Test: with null weight null_weight <- 0.1 null_idx <- p pi_vec <- c(rep((1 - null_weight)/(p - 1), p - 1), null_weight) model_with_null <- list( pi = pi_vec, null_weight = null_weight, null_index = null_idx ) result <- extract_prior_weights(model_with_null) # Should extract non-null weights and rescale to sum to 1 expect_length(result, p - 1) expect_equal(sum(result), 1, tolerance = 1e-10) expect_equal(result, rep(1/(p-1), p-1), tolerance = 1e-10) # Test: null weight provided as argument result_arg <- extract_prior_weights(model_with_null, null_weight = null_weight) expect_equal(result, result_arg) # Test: null_weight = NULL (backwards compatibility) model_null_weight_null <- model_no_null model_null_weight_null$null_weight <- NULL result <- extract_prior_weights(model_null_weight_null) expect_equal(result, rep(1/p, p)) }) test_that("reconstruct_full_weights reconstructs prior weights with null component", { p <- 100 non_null_weights <- rep(1/(p-1), p-1) # Test: no null weight result_no_null <- reconstruct_full_weights(non_null_weights, null_weight = 0) expect_length(result_no_null, p - 1) expect_equal(sum(result_no_null), 1, tolerance = 1e-10) expect_equal(result_no_null, non_null_weights, tolerance = 1e-10) # Test: with null weight null_weight <- 0.1 result_with_null <- reconstruct_full_weights(non_null_weights, null_weight = null_weight) expect_length(result_with_null, p) expect_equal(sum(result_with_null), 1, tolerance = 1e-10) 
expect_equal(result_with_null[p], null_weight, tolerance = 1e-10) expect_equal(sum(result_with_null[1:(p-1)]), 1 - null_weight, tolerance = 1e-10) # Test: null_weight = NULL result_null <- reconstruct_full_weights(non_null_weights, null_weight = NULL) expect_equal(sum(result_null), 1, tolerance = 1e-10) }) test_that("validate_and_override_params validates and adjusts parameters", { # Valid params valid_params <- list( L = 10, prior_tol = 1e-9, residual_variance_upperbound = 1e10, scaled_prior_variance = 0.2, unmappable_effects = "none", convergence_method = "elbo", estimate_prior_variance = TRUE, estimate_prior_method = "EM", estimate_residual_method = "MLE", estimate_residual_variance = TRUE, refine = FALSE, alpha0 = 0.1, beta0 = 0.1, n = 100 ) result <- validate_and_override_params(valid_params) expect_equal(result$prior_tol, 1e-9) expect_false(result$use_NIG) # Test: invalid prior_tol bad_params <- valid_params bad_params$prior_tol <- -1 expect_error(validate_and_override_params(bad_params), "prior_tol must be non-negative") bad_params$prior_tol <- c(1e-9, 1e-8) expect_error(validate_and_override_params(bad_params), "prior_tol must be a numeric scalar") # Test: invalid residual_variance_upperbound (negative value) bad_params <- valid_params bad_params$residual_variance_upperbound <- -1 expect_error(validate_and_override_params(bad_params), "must be positive") # Test: residual_variance_upperbound must be a numeric scalar (not a vector) bad_params <- valid_params bad_params$residual_variance_upperbound <- c(1e10, 1e11) expect_error(validate_and_override_params(bad_params), "residual_variance_upperbound must be a numeric scalar") # Test: residual_variance_upperbound must be numeric (not character) bad_params <- valid_params bad_params$residual_variance_upperbound <- "1e10" expect_error(validate_and_override_params(bad_params), "residual_variance_upperbound must be a numeric scalar") # Test: invalid scaled_prior_variance bad_params <- valid_params 
bad_params$scaled_prior_variance <- -0.1 expect_error(validate_and_override_params(bad_params), "should be positive") # Test: invalid unmappable_effects bad_params <- valid_params bad_params$unmappable_effects <- "invalid" expect_error(validate_and_override_params(bad_params), "must be one of") # Test: unmappable effects overrides convergence method inf_params <- valid_params inf_params$unmappable_effects <- "inf" inf_params$convergence_method <- "elbo" expect_message( result <- validate_and_override_params(inf_params), "Setting convergence_method='pip'" ) expect_equal(result$convergence_method, "pip") # Test: refine incompatible with unmappable effects refine_params <- valid_params refine_params$unmappable_effects <- "inf" refine_params$refine <- TRUE expect_error( validate_and_override_params(refine_params), "Refinement is not supported with unmappable effects" ) # Test: NIG overrides convergence method when L > 1 nig_params <- valid_params nig_params$L <- 10 nig_params$estimate_residual_method <- "NIG" nig_params$convergence_method <- "elbo" nig_params$estimate_prior_method <- "simple" expect_message( result <- validate_and_override_params(nig_params), "PIP convergence" ) expect_message( result <- validate_and_override_params(nig_params), "EM" ) expect_true(result$use_NIG) expect_equal(result$convergence_method, "pip") expect_equal(result$estimate_prior_method, "EM") # Test: NIG does NOT override convergence method when L = 1 # (ELBO is well-defined for single-effect models) nig_params_l1 <- valid_params nig_params_l1$L <- 1 nig_params_l1$estimate_residual_method <- "NIG" nig_params_l1$convergence_method <- "elbo" nig_params_l1$estimate_prior_method <- "EM" result_l1 <- validate_and_override_params(nig_params_l1) expect_true(result_l1$use_NIG) expect_equal(result_l1$convergence_method, "elbo") # Not overridden expect_equal(result_l1$estimate_prior_method, "EM") # Test: NIG overrides estimate_residual_variance = FALSE nig_erv_params <- valid_params 
nig_erv_params$estimate_residual_method <- "NIG" nig_erv_params$estimate_residual_variance <- FALSE nig_erv_params$estimate_prior_method <- "EM" expect_message( result <- validate_and_override_params(nig_erv_params), "estimate_residual_variance = TRUE" ) expect_true(result$estimate_residual_variance) # Test: NIG with explicit estimate_residual_variance = TRUE produces no warning nig_erv_params2 <- valid_params nig_erv_params2$estimate_residual_method <- "NIG" nig_erv_params2$estimate_residual_variance <- TRUE nig_erv_params2$estimate_prior_method <- "EM" # Should not produce the "estimate_residual_variance" warning expect_no_message( result <- validate_and_override_params(nig_erv_params2), message = "integrates out residual variance" ) expect_true(result$estimate_residual_variance) # Test: estimate_prior_variance = FALSE no_est_params <- valid_params no_est_params$estimate_prior_variance <- FALSE result <- validate_and_override_params(no_est_params) expect_equal(result$estimate_prior_method, "none") # Test: NIG with estimate_prior_variance = FALSE respects user choice # The EM override should NOT happen when user explicitly disables prior variance estimation nig_no_prior_params <- valid_params nig_no_prior_params$estimate_residual_method <- "NIG" nig_no_prior_params$estimate_prior_variance <- FALSE nig_no_prior_params$estimate_prior_method <- "optim" result <- validate_and_override_params(nig_no_prior_params) expect_true(result$use_NIG) # estimate_prior_variance = FALSE -> estimate_prior_method stays "none" (set earlier) # The SS block should NOT override to "EM" because estimation is disabled expect_equal(result$estimate_prior_method, "none") # Test: NIG with estimate_prior_variance = TRUE overrides to EM nig_yes_prior_params <- valid_params nig_yes_prior_params$estimate_residual_method <- "NIG" nig_yes_prior_params$estimate_prior_variance <- TRUE nig_yes_prior_params$estimate_prior_method <- "simple" expect_message( result <- 
validate_and_override_params(nig_yes_prior_params), "EM" ) expect_true(result$use_NIG) expect_equal(result$estimate_prior_method, "EM") # Test: NIG rejects alpha0 = 0 (reproduces GitHub issue: L=1, # alpha0 = 0, beta0 > 0 previously produced an infinite ELBO crash) nig_bad_alpha <- valid_params nig_bad_alpha$estimate_residual_method <- "NIG" nig_bad_alpha$alpha0 <- 0 nig_bad_alpha$beta0 <- 0.5 expect_error( validate_and_override_params(nig_bad_alpha), "alpha0 > 0 and beta0 > 0" ) # Test: NIG rejects alpha0 = 0, beta0 = 0 (previously produced # a silent NaN ELBO rather than a proper error) nig_both_zero <- valid_params nig_both_zero$estimate_residual_method <- "NIG" nig_both_zero$alpha0 <- 0 nig_both_zero$beta0 <- 0 expect_error( validate_and_override_params(nig_both_zero), "alpha0 > 0 and beta0 > 0" ) # Test: NIG rejects negative alpha0 nig_neg_alpha <- valid_params nig_neg_alpha$estimate_residual_method <- "NIG" nig_neg_alpha$alpha0 <- -0.5 nig_neg_alpha$beta0 <- 1 expect_error( validate_and_override_params(nig_neg_alpha), "alpha0 > 0 and beta0 > 0" ) # Test: NIG rejects negative beta0 nig_neg_beta <- valid_params nig_neg_beta$estimate_residual_method <- "NIG" nig_neg_beta$alpha0 <- 1 nig_neg_beta$beta0 <- -0.5 expect_error( validate_and_override_params(nig_neg_beta), "alpha0 > 0 and beta0 > 0" ) # Test: NIG rejects non-finite alpha0/beta0 nig_inf <- valid_params nig_inf$estimate_residual_method <- "NIG" nig_inf$alpha0 <- Inf expect_error( validate_and_override_params(nig_inf), "alpha0 > 0 and beta0 > 0" ) nig_na <- valid_params nig_na$estimate_residual_method <- "NIG" nig_na$alpha0 <- NA_real_ expect_error( validate_and_override_params(nig_na), "alpha0 > 0 and beta0 > 0" ) # Test: NIG rejects non-scalar alpha0/beta0 nig_vec <- valid_params nig_vec$estimate_residual_method <- "NIG" nig_vec$alpha0 <- c(0.1, 0.2) expect_error( validate_and_override_params(nig_vec), "alpha0 > 0 and beta0 > 0" ) # Test: NIG rejects NULL alpha0/beta0 (non-numeric) nig_null <- 
valid_params nig_null$estimate_residual_method <- "NIG" nig_null$alpha0 <- NULL expect_error( validate_and_override_params(nig_null), "alpha0 > 0 and beta0 > 0" ) # Test: non-NIG path does NOT validate alpha0/beta0 # (the NIG prior is unused, so invalid values must be silently ignored) no_nig_bad <- valid_params no_nig_bad$estimate_residual_method <- "MLE" no_nig_bad$alpha0 <- 0 no_nig_bad$beta0 <- 0 result <- validate_and_override_params(no_nig_bad) expect_false(result$use_NIG) expect_null(result$alpha0) expect_null(result$beta0) # Test: NIG requires a valid sample size params$n (the default alpha0/beta0 # scale as 1/sqrt(n), so n must be a positive finite scalar) nig_needs_n <- valid_params nig_needs_n$estimate_residual_method <- "NIG" # NULL n rejected nig_needs_n$n <- NULL expect_error( validate_and_override_params(nig_needs_n), "requires a valid sample size" ) # Zero n rejected nig_needs_n$n <- 0 expect_error( validate_and_override_params(nig_needs_n), "requires a valid sample size" ) # Negative n rejected nig_needs_n$n <- -5 expect_error( validate_and_override_params(nig_needs_n), "requires a valid sample size" ) # Non-scalar n rejected nig_needs_n$n <- c(100, 200) expect_error( validate_and_override_params(nig_needs_n), "requires a valid sample size" ) # Valid n passes nig_needs_n$n <- 100 result <- suppressMessages(validate_and_override_params(nig_needs_n)) expect_true(result$use_NIG) }) # ============================================================================= # MODEL INITIALIZATION # ============================================================================= test_that("initialize_matrices creates correct model matrices", { n <- 100 p <- 50 L <- 5 data <- list(n = n, p = p) params <- list( L = L, scaled_prior_variance = 0.2, residual_variance = 1.5, prior_weights = rep(1/p, p), null_weight = 0 ) var_y <- 2.0 result <- initialize_matrices(data, params, var_y) # Check all components exist expected_names <- c("alpha", "mu", "mu2", "V", "KL", "lbf", 
"lbf_variable", "sigma2", "pi", "null_weight", "predictor_weights") expect_true(all(expected_names %in% names(result))) # Check dimensions expect_equal(dim(result$alpha), c(L, p)) expect_equal(dim(result$mu), c(L, p)) expect_equal(dim(result$mu2), c(L, p)) expect_equal(dim(result$lbf_variable), c(L, p)) expect_length(result$V, L) expect_length(result$KL, L) expect_length(result$lbf, L) expect_length(result$predictor_weights, p) # Check initial values expect_equal(result$alpha, matrix(1/p, L, p)) expect_equal(result$mu, matrix(0, L, p)) expect_equal(result$mu2, matrix(0, L, p)) expect_equal(result$V, rep(params$scaled_prior_variance * var_y, L)) expect_equal(result$sigma2, params$residual_variance) expect_equal(result$pi, params$prior_weights) expect_true(all(is.na(result$KL))) expect_true(all(is.na(result$lbf))) }) test_that("initialize_matrices handles vector scaled_prior_variance of length L", { # Regression for GitHub issue: scaled_prior_variance docs allow a length-L # vector, but the refactor's rep(vec * var_y, L) produced length L*L. 
n <- 100; p <- 50; L <- 5 data <- list(n = n, p = p) spv <- c(0.1, 0.2, 0.3, 0.4, 0.5) params <- list( L = L, scaled_prior_variance = spv, residual_variance = 1.5, prior_weights = rep(1 / p, p), null_weight = 0 ) var_y <- 2.0 result <- initialize_matrices(data, params, var_y) expect_length(result$V, L) expect_equal(result$V, spv * var_y) }) test_that("expand_scaled_prior_variance recycles scalar and preserves vector", { expect_equal(expand_scaled_prior_variance(0.2, 2.0, 5), rep(0.4, 5)) expect_equal( expand_scaled_prior_variance(c(0.1, 0.2, 0.3, 0.4, 0.5), 2.0, 5), c(0.2, 0.4, 0.6, 0.8, 1.0) ) }) test_that("validate_and_override_params rejects wrong-length scaled_prior_variance", { base_params <- list( prior_tol = 1e-9, residual_variance_upperbound = 1e4, scaled_prior_variance = c(0.1, 0.2, 0.3), L = 5, unmappable_effects = "none", slot_prior = NULL ) expect_error( validate_and_override_params(base_params), "scalar or a vector of length L" ) }) test_that("susie with vector scaled_prior_variance runs end-to-end (pcarbo example)", { # Regression for GitHub issue requesting per-slot prior variances. # Before the fix, rep(vec * var_y, L) produced length L*L and poisoned # downstream state; susie_get_cs eventually raised 'get_purity returned NaN/NA'. set.seed(1) n <- 200; p <- 100 beta <- rep(0, p); beta[1:4] <- 1 X <- matrix(rnorm(n * p), nrow = n) X <- scale(X, center = TRUE, scale = TRUE) y <- drop(X %*% beta + rnorm(n)) fit <- susie(X, y, L = 10, estimate_prior_variance = FALSE, scaled_prior_variance = rep(1, 10)) expect_length(fit$V, 10) expect_true(all(is.finite(fit$V))) }) test_that("vector scaled_prior_variance composes with model_init L expansion", { # Confirms the preserve-fitted-V behavior (from the s_init/model_init PR) # still applies when scaled_prior_variance is a length-L vector: the first # num_effects entries come from model_init$V; the rest use the user vector. 
set.seed(2) n <- 200; p <- 80 beta <- rep(0, p); beta[1:3] <- 1 X <- scale(matrix(rnorm(n * p), nrow = n), center = TRUE, scale = TRUE) y <- drop(X %*% beta + rnorm(n)) init <- susie(X, y, L = 2, estimate_prior_variance = TRUE) L_new <- 5 spv <- c(0.1, 0.2, 0.3, 0.4, 0.5) fit <- susie(X, y, L = L_new, estimate_prior_variance = FALSE, scaled_prior_variance = spv, model_init = init) expect_length(fit$V, L_new) expect_true(all(is.finite(fit$V))) }) test_that("initialize_null_index sets null index correctly", { data <- list(p = 100) # Test: no null weight model_no_null <- list(null_weight = 0) result <- initialize_null_index(data, model_no_null) expect_equal(result, 0) model_null_null <- list(null_weight = NULL) result <- initialize_null_index(data, model_null_null) expect_equal(result, 0) # Test: with null weight model_with_null <- list(null_weight = 0.1) result <- initialize_null_index(data, model_with_null) expect_equal(result, data$p) }) test_that("assign_names assigns variable names to model components", { p <- 10 L <- 3 data <- list(p = p) model <- list( alpha = matrix(1/p, L, p), mu = matrix(0, L, p), mu2 = matrix(0, L, p), lbf_variable = matrix(0, L, p), pip = rep(0.1, p), null_weight = NULL ) variable_names <- paste0("var", 1:p) # Test: without null weight result <- assign_names(data, model, variable_names) expect_equal(names(result$pip), variable_names) expect_equal(colnames(result$alpha), variable_names) expect_equal(colnames(result$mu), variable_names) expect_equal(colnames(result$mu2), variable_names) expect_equal(colnames(result$lbf_variable), variable_names) # Test: with null weight model$null_weight <- 0.1 model$null_index <- p model$pip <- rep(0.1, p - 1) variable_names_with_null <- c(paste0("var", 1:(p-1)), "null_placeholder") result <- assign_names(data, model, variable_names_with_null) expect_equal(names(result$pip), paste0("var", 1:(p-1))) expect_equal(colnames(result$alpha)[p], "null") # Test: NULL variable names result_null <- assign_names(data, 
model, NULL) expect_null(names(result_null$pip)) }) test_that("adjust_L adjusts number of effects correctly", { p <- 50 L_requested <- 10 num_effects_init <- 5 var_y <- 2.0 model_init_pruned <- list( alpha = matrix(1/p, num_effects_init, p), mu = matrix(0, num_effects_init, p), mu2 = matrix(0, num_effects_init, p), V = rep(1, num_effects_init) ) params <- list( L = L_requested, scaled_prior_variance = 0.2 ) # Test: L > num_effects (should expand) result <- adjust_L(params, model_init_pruned, var_y) expect_equal(result$L, L_requested) expect_equal(nrow(result$model_init$alpha), L_requested) # Test: L < num_effects (should warn and use num_effects) params_small <- params params_small$L <- 3 expect_message( result <- adjust_L(params_small, model_init_pruned, var_y), "is smaller than the" ) expect_equal(result$L, num_effects_init) }) test_that("prune_single_effects expands or filters model effects", { p <- 50 L_init <- 10 model_init <- list( alpha = matrix(1/p, L_init, p), mu = matrix(0, L_init, p), mu2 = matrix(0, L_init, p), lbf_variable = matrix(0, L_init, p), KL = rep(1, L_init), lbf = rep(0, L_init), V = rep(1, L_init), sets = list(cs_index = c(1, 3, 5)) ) # Test: L == num_effects (just removes sets) result_same <- prune_single_effects(model_init, L = L_init, V = NULL) expect_equal(nrow(result_same$alpha), L_init) expect_null(result_same$sets) # Test: expand to larger L with vector V (length(V) > 1) L_expand <- 15 V_expand <- rep(2, L_expand) result_expand <- prune_single_effects(model_init, L = L_expand, V = V_expand) expect_equal(nrow(result_expand$alpha), L_expand) expect_equal(result_expand$V[1:L_init], rep(1, L_init)) expect_equal(result_expand$V[(L_init+1):L_expand], rep(2, L_expand - L_init)) # Test: expand to larger L with scalar V (length(V) == 1) # This tests the else branch: V <- rep(V, L) L_expand_scalar <- 12 V_scalar <- 3 # Single value result_expand_scalar <- prune_single_effects(model_init, L = L_expand_scalar, V = V_scalar) 
expect_equal(nrow(result_expand_scalar$alpha), L_expand_scalar) # When V is scalar, it gets replicated to length L expect_equal(result_expand_scalar$V, rep(V_scalar, L_expand_scalar)) expect_length(result_expand_scalar$V, L_expand_scalar) # All V values should be the same scalar value expect_true(all(result_expand_scalar$V == V_scalar)) }) test_that("add_null_effect adds null effect to model", { p <- 50 L <- 5 model_init <- list( alpha = matrix(1/p, L, p), mu = matrix(0, L, p), mu2 = matrix(0, L, p), lbf_variable = matrix(0, L, p), V = rep(1, L) ) V_null <- 0 result <- add_null_effect(model_init, V_null) # Check dimensions increased expect_equal(nrow(result$alpha), L + 1) expect_equal(nrow(result$mu), L + 1) expect_equal(nrow(result$mu2), L + 1) expect_equal(nrow(result$lbf_variable), L + 1) expect_length(result$V, L + 1) # Check null effect values expect_equal(result$alpha[L + 1, ], rep(1/p, p)) expect_equal(result$mu[L + 1, ], rep(0, p)) expect_equal(result$mu2[L + 1, ], rep(0, p)) expect_equal(result$lbf_variable[L + 1, ], rep(0, p)) expect_equal(result$V[L + 1], V_null) }) # ============================================================================= # CORE ALGORITHM COMPONENTS # ============================================================================= test_that("compute_eigen_decomposition computes eigenvalues and eigenvectors", { base_data <- generate_base_data(n = 100, p = 50, seed = 456) XtX <- crossprod(base_data$X) result <- compute_eigen_decomposition(XtX, base_data$n) # Check components expect_true(all(c("V", "Dsq", "VtXty") %in% names(result))) expect_equal(dim(result$V), c(base_data$p, base_data$p)) expect_length(result$Dsq, base_data$p) expect_null(result$VtXty) # Check eigenvalues in decreasing order expect_true(all(diff(result$Dsq) <= 0)) # Check eigenvalues are non-negative expect_true(all(result$Dsq >= 0)) # Verify decomposition LD <- XtX / base_data$n eig_direct <- eigen(LD, symmetric = TRUE) expect_equal(result$Dsq, sort(eig_direct$values 
* base_data$n, decreasing = TRUE), tolerance = 1e-10) })

# Verifies that add_eigen_decomposition() augments a sufficient-statistics data
# object with the eigen components (vectors, values, V'X'y) used by the
# unmappable-effects models.
test_that("add_eigen_decomposition adds eigen components to data object", {
  base_data <- generate_base_data(n = 100, p = 50, seed = 789)
  XtX <- crossprod(base_data$X)
  Xty <- as.vector(crossprod(base_data$X, base_data$y))
  yty <- sum(base_data$y^2)
  data <- list(
    XtX = XtX,
    Xty = Xty,
    yty = yty,
    n = base_data$n,
    p = base_data$p
  )
  params <- list(
    unmappable_effects = "inf",
    verbose = FALSE
  )
  result <- add_eigen_decomposition(data, params)
  # Check components added
  expect_true(!is.null(result$eigen_vectors))
  expect_true(!is.null(result$eigen_values))
  expect_true(!is.null(result$VtXty))
  # Check dimensions
  expect_equal(dim(result$eigen_vectors), c(base_data$p, base_data$p))
  expect_length(result$eigen_values, base_data$p)
  expect_length(result$VtXty, base_data$p)
  expect_true(all(is.finite(result$VtXty)))
  # Test with unmappable_effects = "none" (no scaling)
  params_none <- list(unmappable_effects = "none", verbose = FALSE)
  result_none <- add_eigen_decomposition(data, params_none)
  expect_true(!is.null(result_none$eigen_vectors))
  # Test with unmappable_effects = "ash" (no raw data storage needed)
  params_ash <- list(unmappable_effects = "ash", verbose = FALSE)
  result_ash <- add_eigen_decomposition(data, params_ash)
  expect_true(!is.null(result_ash$eigen_vectors))
  expect_true(!is.null(result_ash$eigen_values))
  expect_true(!is.null(result_ash$VtXty))
})

# Checks the omega-weighted quantities: omega_var should equal
# tau2 * eigenvalues + sigma2, and the diagonal of X'OmegaX must be positive.
test_that("compute_omega_quantities computes omega-weighted quantities", {
  base_data <- generate_base_data(n = 100, p = 50, seed = 111)
  XtX <- crossprod(base_data$X)
  eigen_decomp <- compute_eigen_decomposition(XtX, base_data$n)
  data <- list(
    eigen_vectors = eigen_decomp$V,
    eigen_values = eigen_decomp$Dsq,
    p = base_data$p
  )
  tau2 <- 0.01
  sigma2 <- 1.0
  result <- compute_omega_quantities(data, tau2, sigma2)
  # Check components
  expect_true(all(c("omega_var", "diagXtOmegaX") %in% names(result)))
  expect_length(result$omega_var, base_data$p)
  expect_length(result$diagXtOmegaX, base_data$p)
  # Check omega_var calculation
  expected_omega_var <- tau2 * data$eigen_values + sigma2
  expect_equal(result$omega_var, expected_omega_var, tolerance = 1e-10)
  # Check diagXtOmegaX is positive
  expect_true(all(result$diagXtOmegaX > 0))
  # Check diagXtOmegaX sums correctly
  # Should be trace of X'OmegaX
  trace_approx <- sum(result$diagXtOmegaX)
  expect_true(trace_approx > 0)
})

# BLUP coefficients: finite for a generic model, and exactly zero (to
# numerical tolerance) when the infinitesimal variance tau2 is zero.
test_that("compute_theta_blup computes BLUP coefficients", {
  base_data <- generate_base_data(n = 100, p = 50, seed = 222)
  L <- 5
  XtX <- crossprod(base_data$X)
  Xty <- as.vector(crossprod(base_data$X, base_data$y))
  eigen_decomp <- compute_eigen_decomposition(XtX, base_data$n)
  data <- list(
    eigen_vectors = eigen_decomp$V,
    eigen_values = eigen_decomp$Dsq,
    VtXty = crossprod(eigen_decomp$V, Xty),
    p = base_data$p
  )
  model <- list(
    alpha = matrix(1/base_data$p, L, base_data$p),
    mu = matrix(rnorm(L * base_data$p, 0, 0.1), L, base_data$p),
    tau2 = 0.01,
    sigma2 = 1.0
  )
  result <- compute_theta_blup(data, model)
  # Check output
  expect_length(result, base_data$p)
  # Check finite values
  expect_true(all(is.finite(result)))
  # When tau2 = 0, theta should be 0
  model_zero_tau2 <- model
  model_zero_tau2$tau2 <- 0
  result_zero <- compute_theta_blup(data, model_zero_tau2)
  expect_true(all(abs(as.vector(result_zero)) < 1e-10))
})

# lbf_stabilization: lpo = lbf + log(prior + eps); infinite shat2 entries
# must zero the LBF and fall back to the log-prior alone.
test_that("lbf_stabilization stabilizes log Bayes factors", {
  p <- 100
  lbf <- rnorm(p, mean = 5, sd = 2)
  prior_weights <- rep(1/p, p)
  shat2 <- rgamma(p, shape = 2, rate = 1)
  result <- lbf_stabilization(lbf, prior_weights, shat2)
  # Check components
  expect_true(all(c("lbf", "lpo") %in% names(result)))
  expect_length(result$lbf, p)
  expect_length(result$lpo, p)
  # Check lpo calculation
  expected_lpo <- lbf + log(prior_weights + sqrt(.Machine$double.eps))
  expect_equal(result$lpo, expected_lpo, tolerance = 1e-10)
  # Test with infinite shat2
  shat2_inf <- shat2
  shat2_inf[c(1, 5, 10)] <- Inf
  result_inf <- lbf_stabilization(lbf, prior_weights, shat2_inf)
  # LBF should be 0 where shat2 is infinite
  expect_equal(result_inf$lbf[c(1, 5, 10)], rep(0, 3))
  # LPO should be log(prior) where shat2 is infinite
  expected_lpo_inf <- log(prior_weights[c(1, 5, 10)] + sqrt(.Machine$double.eps))
  expect_equal(result_inf$lpo[c(1, 5, 10)], expected_lpo_inf, tolerance = 1e-10)
})

# Posterior weights must be a softmax of lpo (numerically stabilized by
# subtracting the max), with lbf_model the corresponding log-sum-exp.
test_that("compute_posterior_weights computes alpha and lbf_model", {
  p <- 100
  lbf <- rnorm(p, mean = 5, sd = 2)
  prior_weights <- rep(1/p, p)
  lpo <- lbf + log(prior_weights)
  result <- compute_posterior_weights(lpo)
  # Check components
  expect_true(all(c("alpha", "lbf_model") %in% names(result)))
  expect_length(result$alpha, p)
  expect_length(result$lbf_model, 1)
  # Check alpha sums to 1
  expect_equal(sum(result$alpha), 1, tolerance = 1e-10)
  # Check alpha values are probabilities
  expect_true(all(result$alpha >= 0))
  expect_true(all(result$alpha <= 1))
  # Verify calculation
  max_lpo <- max(lpo)
  w_weighted <- exp(lpo - max_lpo)
  weighted_sum_w <- sum(w_weighted)
  expected_alpha <- w_weighted / weighted_sum_w
  expected_lbf_model <- log(weighted_sum_w) + max_lpo
  expect_equal(result$alpha, expected_alpha, tolerance = 1e-10)
  expect_equal(result$lbf_model, expected_lbf_model, tolerance = 1e-10)
  # Test numerical stability with very large lpo
  lpo_large <- c(1000, 1001, 1002, rep(0, p - 3))
  result_large <- compute_posterior_weights(lpo_large)
  expect_equal(sum(result_large$alpha), 1, tolerance = 1e-10)
  expect_true(all(result_large$alpha >= 0 & result_large$alpha <= 1))
})

# Gradient used when optimizing the prior variance V: finite for a range of
# V, NULL under the NIG prior, and robust to zero shat2/betahat inputs.
test_that("compute_lbf_gradient computes gradient for prior variance", {
  p <- 100
  alpha <- rep(1/p, p)
  betahat <- rnorm(p, mean = 0, sd = 1)
  shat2 <- rgamma(p, shape = 2, rate = 1)
  V <- 1.0
  result <- compute_lbf_gradient(alpha, betahat, shat2, V, use_NIG = FALSE)
  # Check output is numeric scalar
  expect_length(result, 1)
  expect_true(is.finite(result))
  # Test with different V values
  result_small_V <- compute_lbf_gradient(alpha, betahat, shat2, V = 0.1, use_NIG = FALSE)
  result_large_V <- compute_lbf_gradient(alpha, betahat, shat2, V = 10, use_NIG = FALSE)
  expect_true(is.finite(result_small_V))
  expect_true(is.finite(result_large_V))
  # Test with NIG (should return NULL)
  result_nig <- compute_lbf_gradient(alpha, betahat, shat2, V, use_NIG = TRUE)
  expect_null(result_nig)
  # Test with NaN in intermediate calculations (should handle)
  shat2_zero <- rep(0, p)
  betahat_zero <- rep(0, p)
  result_nan <- compute_lbf_gradient(alpha, betahat_zero, shat2_zero, V, use_NIG = FALSE)
  expect_true(is.finite(result_nan))
})

# =============================================================================
# VARIANCE ESTIMATION
# =============================================================================

# Method-of-moments estimator for (sigma2, tau2); also exercises the
# verbose-message paths for both the joint and sigma2-only updates.
test_that("mom_unmappable estimates variance using method of moments", {
  # Setup test data
  setup <- setup_ss_data(n = 100, p = 50, L = 5, seed = 333, unmappable_effects = "inf")
  data <- setup$data
  params <- setup$params
  params$verbose <- FALSE
  model <- setup$model
  # Compute omega
  L <- nrow(model$alpha)
  omega_res <- compute_omega_quantities(data, model$tau2, model$sigma2)
  omega <- matrix(0, L, data$p)
  for (l in seq_len(L)) {
    omega[l, ] <- omega_res$diagXtOmegaX + 1 / model$V[l]
  }
  # Test estimating both tau2 and sigma2
  result <- mom_unmappable(data, params, model, omega, tau2 = model$tau2, est_tau2 = TRUE, est_sigma2 = TRUE)
  expect_true(all(c("sigma2", "tau2") %in% names(result)))
  expect_true(result$sigma2 > 0)
  expect_true(result$tau2 >= 0)
  # Test estimating only sigma2
  result_sigma_only <- mom_unmappable(data, params, model, omega, tau2 = 0.01, est_tau2 = FALSE, est_sigma2 = TRUE)
  expect_true(result_sigma_only$sigma2 > 0)
  expect_equal(result_sigma_only$tau2, 0.01)
  # Test verbose message when estimating both tau2 and sigma2
  params_verbose <- params
  params_verbose$verbose <- TRUE
  expect_message(
    result_verbose_both <- mom_unmappable(data, params_verbose, model, omega, tau2 = model$tau2, est_tau2 = TRUE, est_sigma2 = TRUE),
    "Update \\(sigma\\^2,tau\\^2\\) to"
  )
  expect_true(all(c("sigma2", "tau2") %in% names(result_verbose_both)))
  # Test verbose message when estimating only sigma2
  expect_message(
    result_verbose_sigma <- mom_unmappable(data, params_verbose, model, omega, tau2 = 0.01, est_tau2 = FALSE, est_sigma2 = TRUE),
    "Update sigma\\^2 to"
  )
  expect_true(result_verbose_sigma$sigma2 > 0)
  expect_equal(result_verbose_sigma$tau2, 0.01)
})

# MLE counterpart of the test above; mirrors its structure (note: no tau2
# argument here, unlike mom_unmappable).
test_that("mle_unmappable estimates variance using MLE", {
  # Setup test data
  setup <- setup_ss_data(n = 100, p = 50, L = 5, seed = 444, unmappable_effects = "inf")
  data <- setup$data
  params <- setup$params
  params$verbose <- FALSE
  model <- setup$model
  # Compute omega
  L <- nrow(model$alpha)
  omega_res <- compute_omega_quantities(data, model$tau2, model$sigma2)
  omega <- matrix(0, L, data$p)
  for (l in seq_len(L)) {
    omega[l, ] <- omega_res$diagXtOmegaX + 1 / model$V[l]
  }
  # Test estimating both tau2 and sigma2
  result <- mle_unmappable(data, params, model, omega, est_tau2 = TRUE, est_sigma2 = TRUE)
  expect_true(all(c("sigma2", "tau2") %in% names(result)))
  expect_true(result$sigma2 > 0)
  expect_true(result$tau2 >= 0)
  # Test estimating only sigma2
  result_sigma_only <- mle_unmappable(data, params, model, omega, est_tau2 = FALSE, est_sigma2 = TRUE)
  expect_true(result_sigma_only$sigma2 > 0)
  # Test verbose message when estimating both tau2 and sigma2
  params_verbose <- params
  params_verbose$verbose <- TRUE
  expect_message(
    result_verbose_both <- mle_unmappable(data, params_verbose, model, omega, est_tau2 = TRUE, est_sigma2 = TRUE),
    "Update \\(sigma\\^2,tau\\^2\\) to"
  )
  expect_true(all(c("sigma2", "tau2") %in% names(result_verbose_both)))
  # Test verbose message when estimating only sigma2
  expect_message(
    result_verbose_sigma <- mle_unmappable(data, params_verbose, model, omega, est_tau2 = FALSE, est_sigma2 = TRUE),
    "Update sigma\\^2 to"
  )
  expect_true(result_verbose_sigma$sigma2 > 0)
})

# NIG (normal-inverse-gamma) log Bayes factor: positive under true signal,
# finite under the null and for alternative prior hyperparameters.
test_that("compute_lbf_NIG_univariate computes log Bayes factor", {
  set.seed(555)
  n <- 100
  x <- rnorm(n)
  y <- 2 * x + rnorm(n)
  s0 <- 1
  alpha0 <- 0
  beta0 <- 0
  result <- compute_lbf_NIG_univariate(x, y, s0, alpha0, beta0)
  # Check output is numeric scalar
  expect_length(result, 1)
  expect_true(is.finite(result))
  # LBF should be positive when there's signal
  expect_true(result > 0)
  # Test with no signal
  x_null <- rnorm(n)
  y_null <- rnorm(n)
  result_null <- compute_lbf_NIG_univariate(x_null, y_null, s0, alpha0, beta0)
  expect_true(is.finite(result_null))
  # Test with different prior parameters
  result_alpha <- compute_lbf_NIG_univariate(x, y, s0, alpha0 = 2, beta0 = 1)
  expect_true(is.finite(result_alpha))
})

# NIG posterior mean should shrink the OLS estimate toward zero, with
# stronger shrinkage for a smaller prior scale s0_t.
test_that("posterior_mean_NIG computes posterior mean", {
  set.seed(666)
  p <- 50
  xtx <- 100
  xty <- 50
  s0_t <- 1
  result <- posterior_mean_NIG(xtx, xty, s0_t)
  # Check output is numeric
  expect_length(result, 1)
  expect_true(is.finite(result))
  # Posterior mean should be shrunk toward zero
  ols_est <- xty / xtx
  expect_true(abs(result) < abs(ols_est))
  # Test with very small prior (strong shrinkage)
  result_small <- posterior_mean_NIG(xtx, xty, s0_t = 0.01)
  expect_true(abs(result_small) < abs(result))
})

# NIG posterior variance: positive for a normal prior scale; a tiny prior
# (s0_t = 1e-6) should collapse both post_var and beta1 to exactly 0.
test_that("posterior_var_NIG computes posterior variance", {
  set.seed(777)
  xtx <- 100
  xty <- 50
  yty <- 1000
  n <- 100
  s0_t <- 1
  result <- posterior_var_NIG(xtx, xty, yty, n, s0_t)
  # Check components
  expect_true(all(c("post_var", "beta1") %in% names(result)))
  expect_true(is.finite(result$post_var))
  expect_true(is.finite(result$beta1))
  # Posterior variance should be positive
  expect_true(result$post_var > 0)
  # Test with very small prior (should return 0)
  result_small <- posterior_var_NIG(xtx, xty, yty, n, s0_t = 1e-6)
  expect_equal(result_small$post_var, 0)
  expect_equal(result_small$beta1, 0)
})

test_that("est_residual_variance estimates residual variance", {
  # Setup individual data
  setup <- setup_individual_data(n = 100, p = 50, L = 5, seed = 888)
  data <- setup$data
  model <- setup$model
  result <- est_residual_variance(data, model)
  # Check output is numeric and positive
  expect_length(result, 1)
  expect_true(is.finite(result))
  expect_true(result > 0)
  # Should be reasonable for random data
  expect_true(result < 10)
})

# update_model_variance must respect the configured lower/upper bounds on
# the residual variance when estimation is enabled.
test_that("update_model_variance updates variance components", {
  # Setup individual data with all necessary methods defined
  setup <- setup_individual_data(n = 100, p = 50, L = 5, seed = 999)
  data <- setup$data
  params <- setup$params
  params$estimate_residual_variance <- TRUE
  params$estimate_residual_method <- "MLE"
  params$residual_variance_lowerbound <- 0.01
  params$residual_variance_upperbound <- 10
  params$unmappable_effects <- "none"
  model <- setup$model
  old_sigma2 <- model$sigma2
  result <- update_model_variance(data, params, model)
  # Check sigma2 was updated
  expect_true("sigma2" %in% names(result))
  # Check sigma2 is within bounds
  expect_true(result$sigma2 >= params$residual_variance_lowerbound)
  expect_true(result$sigma2 <= params$residual_variance_upperbound)
  # Check it's finite and positive
  expect_true(is.finite(result$sigma2))
  expect_true(result$sigma2 > 0)
})

# =============================================================================
# CONVERGENCE & OPTIMIZATION
# =============================================================================

# Covers all convergence paths: first-iteration short-circuit, ELBO-based
# convergence/non-convergence, PIP-based convergence, and the message-emitting
# fallback from a NA/infinite ELBO to PIP-based checking.
test_that("check_convergence detects convergence correctly", {
  p <- 50
  L <- 5
  params <- list(
    convergence_method = "elbo",
    tol = 1e-4,
    verbose = FALSE
  )
  model <- list(
    alpha = matrix(1/p, L, p),
    runtime = list(
      prev_elbo = -1000,
      prev_alpha = matrix(1/p, L, p),
      prev_pip_diff = NULL
    )
  )
  # Test: first iteration (should not converge)
  result_iter1 <- check_convergence(NULL, params, model, elbo = c(-1000, -999), iter = 1)
  expect_false(result_iter1$converged)
  # Test: ELBO converged
  elbo_converged <- c(-1000, -999.99)
  result_elbo_conv <- check_convergence(NULL, params, model, elbo = elbo_converged, iter = 2)
  expect_true(result_elbo_conv$converged)
  # Test: ELBO not converged
  model$runtime$prev_elbo <- -1000
  elbo_not_conv <- c(NA, NA, -990)
  result_elbo_not <- check_convergence(NULL, params, model, elbo = elbo_not_conv, iter = 2)
  expect_false(result_elbo_not$converged)
  # Test: PIP convergence
  params_pip <- list(
    convergence_method = "pip",
    tol = 1e-4,
    verbose = FALSE
  )
  # PIP converged (alpha unchanged)
  result_pip_conv <- check_convergence(NULL, params_pip, model, elbo = c(-1000, -999), iter = 2)
  expect_true(result_pip_conv$converged)
  # PIP not converged (alpha changed)
  model_changed <- model
  model_changed$alpha[1, 1] <- 0.5
  result_pip_not <- check_convergence(NULL, params_pip, model_changed, elbo = c(-1000, -999), iter = 2)
  expect_false(result_pip_not$converged)
  # Test: ELBO is NA/Inf (fallback to PIP)
  expect_message(
    result_na <- check_convergence(NULL, params, model, elbo = c(-1000, NA), iter = 2),
    "NA/infinite ELBO"
  )
  expect_true(result_na$converged)  # Alpha unchanged, so converged by PIP
})

# A period-2 alpha oscillation (a <-> b) should be detected as a cycle and
# resolved by averaging the two alpha matrices.
test_that("PIP convergence detects and averages short alpha cycles", {
  alpha_a <- matrix(c(0.9, 0.1, 0.2, 0.8), nrow = 2, byrow = TRUE)
  alpha_b <- matrix(c(0.1, 0.9, 0.8, 0.2), nrow = 2, byrow = TRUE)
  model <- list(
    alpha = alpha_a,
    runtime = list(
      prev_alpha = alpha_b,
      alpha_history = list(alpha_a, alpha_b),
      pip_history = list(susie_get_pip(alpha_a), susie_get_pip(alpha_b))
    )
  )
  params <- list(tol = 1e-4, pip_stall_window = 5, prior_tol = 1e-9)
  result <- check_alpha_pip_cycle_convergence(NULL, params, model)
  expect_true(result$converged)
  expect_equal(result$convergence_reason, "alpha_pip_cycle_2")
  expect_equal(result$alpha, (alpha_a + alpha_b) / 2)
})

# ELBO computation for both the individual-data path and the
# unmappable-effects ("inf") sufficient-statistics path.
test_that("get_objective computes ELBO correctly", {
  # Setup individual data
  setup <- setup_individual_data(n = 100, p = 50, L = 5, seed = 101)
  data <- setup$data
  params <- setup$params
  params$unmappable_effects <- "none"
  params$verbose <- FALSE
  model <- setup$model
  model$KL <- rep(0.1, 5)
  result <- get_objective(data, params, model)
  # Check output is numeric scalar
  expect_length(result, 1)
  expect_true(is.finite(result))
  # ELBO should be negative for random data
  expect_true(result < 0)
  # Test with unmappable effects
  setup_inf <- setup_ss_data(n = 100, p = 50, L = 5, seed = 102, unmappable_effects = "inf")
  data_inf <- setup_inf$data
  params_inf <- setup_inf$params
  params_inf$unmappable_effects <- "inf"
  params_inf$verbose <- FALSE
  model_inf <- setup_inf$model
  model_inf$KL <- rep(0.1, 5)
  model_inf$lbf <- rep(0, 5)
  result_inf <- get_objective(data_inf, params_inf, model_inf)
  expect_length(result_inf, 1)
  expect_true(is.finite(result_inf))
})

test_that("compute_elbo_inf computes ELBO for infinitesimal model", {
  # Setup data
  setup <- setup_ss_data(n = 100, p = 50, L = 5, seed = 103, unmappable_effects = "inf")
  data <- setup$data
  model <- setup$model
  # Compute omega
  L <- nrow(model$alpha)
  omega_res <- compute_omega_quantities(data, model$tau2, model$sigma2)
  omega <- matrix(0, L, data$p)
  for (l in seq_len(L)) {
    omega[l, ] <- omega_res$diagXtOmegaX + 1 / model$V[l]
  }
  result <- compute_elbo_inf(
    alpha = model$alpha,
    mu = model$mu,
    omega = omega,
    lbf = rep(0, L),
    sigma2 = model$sigma2,
    tau2 = model$tau2,
    n = data$n,
    p = data$p,
    eigen_vectors = data$eigen_vectors,
    eigen_values = data$eigen_values,
    VtXty = data$VtXty,
    yty = data$yty
  )
  # Check output is numeric scalar
  expect_length(result, 1)
  expect_true(is.finite(result))
  # ELBO should be negative
  expect_true(result < 0)
})

# =============================================================================
# CREDIBLE SETS & POST-PROCESSING
# =============================================================================

test_that("n_in_CS_x counts variables in credible set", {
  # Probability vector with clear peak
  x <- c(0.5, 0.3, 0.1, 0.05, 0.03, 0.02)
  # With 90% coverage, should include first 2 variables (0.5 + 0.3 = 0.8 < 0.9, add 0.1)
  result_90 <- n_in_CS_x(x, coverage = 0.9)
  expect_equal(result_90, 3)
  # With 95% coverage, should include more
  result_95 <- n_in_CS_x(x, coverage = 0.95)
  expect_true(result_95 >= result_90)
  # With 50% coverage
  result_50 <- n_in_CS_x(x, coverage = 0.5)
  expect_equal(result_50, 1)
  # Uniform distribution
  # NOTE: skip() halts this test here, so the uniform-distribution assertions
  # below never run on any platform, not just Linux CI.
  skip("Fails on Linux in CI")
  x_uniform <- rep(1/10, 10)
  result_uniform <- n_in_CS_x(x_uniform, coverage = 0.9)
  expect_equal(result_uniform, 10)  # Need all to reach 90%
})

test_that("in_CS_x creates binary indicator for credible set", {
  x <- c(0.5, 0.3, 0.1, 0.05, 0.03, 0.02)
  result_90 <- in_CS_x(x, coverage = 0.9)
  # Check output is binary
  expect_equal(sort(unique(result_90)), c(0, 1))
  expect_length(result_90, length(x))
  # Check correct variables included
  expect_equal(sum(result_90), n_in_CS_x(x, coverage = 0.9))
  # Top probability should be in CS
  expect_equal(result_90[which.max(x)], 1)
  # Test with different coverage
  result_50 <- in_CS_x(x, coverage = 0.5)
  expect_equal(sum(result_50), 1)
})

# in_CS accepts either a "susie" object or a bare alpha matrix and must give
# identical results for both.
test_that("in_CS creates credible set matrix", {
  L <- 5
  p <- 100
  # Create susie object
  alpha <- matrix(0, L, p)
  for (l in 1:L) {
    alpha[l, sample(p, 1)] <- 0.6
    alpha[l, ] <- alpha[l, ] / sum(alpha[l, ]) * 0.9
    alpha[l, ] <- alpha[l, ] + 0.1 / p
  }
  res <- list(alpha = alpha)
  class(res) <- "susie"
  result <- in_CS(res, coverage = 0.9)
  # Check dimensions
  expect_equal(dim(result), c(L, p))
  # Check binary values
  expect_true(all(result %in% c(0, 1)))
  # Each row should have at least one variable
  expect_true(all(rowSums(result) > 0))
  # Test with just alpha matrix
  result_alpha <- in_CS(alpha, coverage = 0.9)
  expect_equal(result, result_alpha)
})

test_that("n_in_CS counts variables in each credible set", {
  L <- 5
  p <- 100
  alpha <- matrix(0, L, p)
  for (l in 1:L) {
    alpha[l, sample(p, 1)] <- 0.7
    alpha[l, ] <- alpha[l, ] / sum(alpha[l, ]) * 0.9
    alpha[l, ] <- alpha[l, ] + 0.1 / p
  }
  res <- list(alpha = alpha)
  class(res) <- "susie"
  result <- n_in_CS(res, coverage = 0.9)
  # Check output
  expect_length(result, L)
  expect_true(all(result > 0))
  expect_true(all(result <= p))
  # Should match in_CS
  cs_matrix <- in_CS(res, coverage = 0.9)
  expect_equal(result, rowSums(cs_matrix))
})

test_that("get_purity computes correlation purity statistics", {
  base_data <- generate_base_data(n = 100, p = 50, seed = 123)
  # Test with multiple variables
  pos <- c(1, 2, 3, 5, 8)
  result <- get_purity(pos, base_data$X, Xcorr = NULL)
  # Check output
  expect_length(result, 3)  # min, mean, median
  expect_true(all(result >= 0))
  expect_true(all(result <= 1))
  # Mean should be between min and max (which is implicitly <= 1)
  expect_true(result[2] >= result[1])
  # Test with single variable (perfect purity)
  result_single <- get_purity(1, base_data$X, Xcorr = NULL)
  expect_equal(result_single, c(1, 1, 1))
  # Test with precomputed correlation
  Xcorr <- cor(base_data$X)
  result_xcorr <- get_purity(pos, base_data$X, Xcorr = Xcorr)
  expect_length(result_xcorr, 3)
  expect_true(all(result_xcorr >= 0))
  # Test with large set (should subsample)
  pos_large <- 1:40
  result_large <- get_purity(pos_large, base_data$X, Xcorr = NULL, n = 20)
  expect_length(result_large, 3)
  # Test squared correlations
  result_squared <- get_purity(pos, base_data$X, Xcorr = NULL, squared = TRUE)
  expect_length(result_squared, 3)
  expect_true(all(result_squared >= 0))
  expect_true(all(result_squared <= 1))
})

# =============================================================================
# END OF TESTS
# =============================================================================



================================================
FILE: tests/testthat/test_susie_workhorse.R
================================================
context("SuSiE Workhorse - Main Orchestration")

# =============================================================================
# BASIC FUNCTIONALITY
# =============================================================================

test_that("susie_workhorse returns valid susie object", {
  setup <- setup_individual_data(n = 100, p = 50, L = 5)
  setup$params$max_iter <- 10
  setup$params$convergence_method <- "elbo"
  setup$params$tol <- 1e-3
  result <- susie_workhorse(setup$data, setup$params)
  expect_s3_class(result, "susie")
  expect_type(result, "list")
})

test_that("susie_workhorse creates all required output fields", {
  setup <- setup_individual_data(n = 100, p = 50, L = 5)
  setup$params$max_iter <- 10
  setup$params$convergence_method <- "elbo"
  setup$params$tol <- 1e-3
  result <- susie_workhorse(setup$data, setup$params)
  # Core posterior components
  expect_true("alpha" %in% names(result))
  expect_true("mu" %in% names(result))
  expect_true("mu2" %in% names(result))
  expect_true("V" %in% names(result))
  expect_true("sigma2" %in% names(result))
  # Tracking components
  expect_true("lbf" %in% names(result))
  expect_true("lbf_variable" %in% names(result))
  expect_true("KL" %in% names(result))
  # Output fields
  expect_true("elbo" %in% names(result))
  expect_true("niter" %in% names(result))
  expect_true("converged" %in% names(result))
  expect_true("pip" %in% names(result))
  expect_true("sets" %in% names(result))
  expect_true("fitted" %in% names(result))
  expect_true("intercept" %in% names(result))
})

test_that("susie_workhorse returns correct dimensions", {
  n <- 100
  p <- 50
  L <- 5
  setup <- setup_individual_data(n = n, p = p, L = L)
  setup$params$max_iter <- 10
  setup$params$convergence_method <- "elbo"
  setup$params$tol <- 1e-3
  result <- susie_workhorse(setup$data, setup$params)
  expect_equal(dim(result$alpha), c(L, p))
  expect_equal(dim(result$mu), c(L, p))
  expect_equal(dim(result$mu2), c(L, p))
  expect_equal(dim(result$lbf_variable), c(L, p))
  expect_length(result$V, L)
  expect_length(result$lbf, L)
  expect_length(result$KL, L)
  expect_length(result$pip, p)
  expect_length(result$fitted, n)
})

# =============================================================================
# CONVERGENCE BEHAVIOR
# =============================================================================

test_that("susie_workhorse sets converged flag when converged", {
  # Use simple data and loose tolerance to ensure convergence
  setup <- setup_individual_data(n = 50, p = 20, L = 3)
  setup$params$max_iter <- 100
  setup$params$convergence_method <- "elbo"
  setup$params$tol <- 1e-2
  result <- susie_workhorse(setup$data, setup$params)
  # Should converge with enough iterations
  expect_true("converged" %in% names(result))
  expect_type(result$converged, "logical")
})
test_that("susie_workhorse warns when not converged", {
  setup <- setup_individual_data(n = 100, p = 50, L = 5)
  setup$params$max_iter <- 1  # Too few iterations
  setup$params$convergence_method <- "elbo"
  setup$params$tol <- 1e-10  # Very strict tolerance
  # Should warn about not converging
  result <- susie_workhorse(setup$data, setup$params)
  # Check convergence status
  expect_false(result$converged)
  expect_equal(result$niter, 1)
})

test_that("susie_workhorse tracks ELBO correctly", {
  setup <- setup_individual_data(n = 100, p = 50, L = 5)
  setup$params$max_iter <- 10
  setup$params$convergence_method <- "elbo"
  setup$params$tol <- 1e-3
  result <- susie_workhorse(setup$data, setup$params)
  expect_true("elbo" %in% names(result))
  expect_true(all(is.finite(result$elbo)))
  expect_true(length(result$elbo) <= setup$params$max_iter)
  expect_true(length(result$elbo) > 0)
})

# Variational lower bound property: each coordinate-ascent iteration should
# not decrease the ELBO (small tolerance for floating-point noise).
test_that("susie_workhorse ELBO increases monotonically", {
  setup <- setup_individual_data(n = 100, p = 50, L = 5)
  setup$params$max_iter <- 20
  setup$params$convergence_method <- "elbo"
  setup$params$tol <- 1e-3
  result <- susie_workhorse(setup$data, setup$params)
  # ELBO should be non-decreasing (allow small numerical errors)
  elbo_diff <- diff(result$elbo)
  expect_true(all(elbo_diff >= -1e-6))
})

test_that("susie_workhorse records correct number of iterations", {
  setup <- setup_individual_data(n = 100, p = 50, L = 5)
  setup$params$max_iter <- 15
  setup$params$convergence_method <- "elbo"
  setup$params$tol <- 1e-3
  result <- susie_workhorse(setup$data, setup$params)
  expect_true("niter" %in% names(result))
  expect_true(result$niter <= setup$params$max_iter)
  expect_true(result$niter > 0)
  expect_equal(result$niter, length(result$elbo))
})

# =============================================================================
# VARIANCE ESTIMATION
# =============================================================================

test_that("susie_workhorse updates residual variance when requested", {
  setup <- setup_individual_data(n = 100, p = 50, L = 5)
  setup$params$max_iter <- 10
  setup$params$convergence_method <- "elbo"
  setup$params$tol <- 1e-3
  setup$params$estimate_residual_variance <- TRUE
  setup$params$residual_variance <- 1.5  # Initial value
  result <- susie_workhorse(setup$data, setup$params)
  # Residual variance should be updated from initial value
  expect_true(result$sigma2 > 0)
  expect_true(is.finite(result$sigma2))
})

test_that("susie_workhorse does not update residual variance when not requested", {
  setup <- setup_individual_data(n = 100, p = 50, L = 5)
  setup$params$max_iter <- 10
  setup$params$convergence_method <- "elbo"
  setup$params$tol <- 1e-3
  setup$params$estimate_residual_variance <- FALSE
  setup$params$residual_variance <- 2.0  # Fixed value
  result <- susie_workhorse(setup$data, setup$params)
  # Residual variance should remain at initial value
  expect_equal(result$sigma2, 2.0)
})

# =============================================================================
# MATHEMATICAL PROPERTIES
# =============================================================================

test_that("susie_workhorse maintains valid probability distributions", {
  setup <- setup_individual_data(n = 100, p = 50, L = 5)
  setup$params$max_iter <- 10
  setup$params$convergence_method <- "elbo"
  setup$params$tol <- 1e-3
  result <- susie_workhorse(setup$data, setup$params)
  # Each row of alpha should sum to 1
  row_sums <- rowSums(result$alpha)
  expect_equal(row_sums, rep(1, 5), tolerance = 1e-10)
  expect_true(all(result$alpha >= 0 & result$alpha <= 1))
})

test_that("susie_workhorse produces valid PIPs", {
  setup <- setup_individual_data(n = 100, p = 50, L = 5)
  setup$params$max_iter <- 10
  setup$params$convergence_method <- "elbo"
  setup$params$tol <- 1e-3
  result <- susie_workhorse(setup$data, setup$params)
  # PIPs should be valid probabilities
  expect_true(all(result$pip >= 0))
  expect_true(all(result$pip <= 1))
  expect_true(all(is.finite(result$pip)))
})

test_that("susie_workhorse V values are non-negative", {
  setup <- setup_individual_data(n = 100, p = 50, L = 5)
  setup$params$max_iter <- 10
  setup$params$convergence_method <- "elbo"
  setup$params$tol <- 1e-3
  result <- susie_workhorse(setup$data, setup$params)
  expect_true(all(result$V >= 0))
  expect_true(all(is.finite(result$V)))
})

test_that("susie_workhorse sigma2 is positive", {
  setup <- setup_individual_data(n = 100, p = 50, L = 5)
  setup$params$max_iter <- 10
  setup$params$convergence_method <- "elbo"
  setup$params$tol <- 1e-3
  result <- susie_workhorse(setup$data, setup$params)
  expect_true(result$sigma2 > 0)
  expect_true(is.finite(result$sigma2))
})

test_that("susie_workhorse KL divergences are non-negative", {
  setup <- setup_individual_data(n = 100, p = 50, L = 5)
  setup$params$max_iter <- 10
  setup$params$convergence_method <- "elbo"
  setup$params$tol <- 1e-3
  result <- susie_workhorse(setup$data, setup$params)
  # KL divergence should be non-negative (allow small numerical errors)
  expect_true(all(result$KL >= -1e-6))
  expect_true(all(is.finite(result$KL)))
})

# =============================================================================
# EDGE CASES
# =============================================================================

test_that("susie_workhorse works with L=1", {
  setup <- setup_individual_data(n = 100, p = 50, L = 1)
  setup$params$max_iter <- 10
  setup$params$convergence_method <- "elbo"
  setup$params$tol <- 1e-3
  result <- susie_workhorse(setup$data, setup$params)
  expect_s3_class(result, "susie")
  expect_equal(dim(result$alpha), c(1, 50))
  expect_equal(sum(result$alpha), 1, tolerance = 1e-10)
})

test_that("susie_workhorse works with small p", {
  setup <- setup_individual_data(n = 100, p = 10, L = 5)
  setup$params$max_iter <- 10
  setup$params$convergence_method <- "elbo"
  setup$params$tol <- 1e-3
  result <- susie_workhorse(setup$data, setup$params)
  expect_s3_class(result, "susie")
  # L should be adjusted to min(L, p)
  expect_true(nrow(result$alpha) <= 10)
})

test_that("susie_workhorse works with max_iter=1", {
  setup <- setup_individual_data(n = 100, p = 50, L = 5)
  setup$params$max_iter <- 1
  setup$params$convergence_method <- "elbo"
  setup$params$tol <- 1e-3
  # Should work but likely not converge
  result <- susie_workhorse(setup$data, setup$params)
  expect_s3_class(result, "susie")
  expect_equal(result$niter, 1)
  # With max_iter=1, may or may not converge depending on data
})

# =============================================================================
# CONVERGENCE METHODS
# =============================================================================

test_that("susie_workhorse works with ELBO convergence", {
  setup <- setup_individual_data(n = 100, p = 50, L = 5)
  setup$params$max_iter <- 20
  setup$params$convergence_method <- "elbo"
  setup$params$tol <- 1e-3
  result <- susie_workhorse(setup$data, setup$params)
  expect_s3_class(result, "susie")
  expect_true("elbo" %in% names(result))
})

test_that("susie_workhorse works with PIP convergence", {
  setup <- setup_individual_data(n = 100, p = 50, L = 5)
  setup$params$max_iter <- 20
  setup$params$convergence_method <- "pip"
  setup$params$tol <- 1e-3
  result <- susie_workhorse(setup$data, setup$params)
  expect_s3_class(result, "susie")
  expect_true("pip" %in% names(result))
})

# =============================================================================
# REFINEMENT
# =============================================================================

test_that("susie_workhorse respects refine=FALSE", {
  setup <- setup_individual_data(n = 100, p = 50, L = 5)
  setup$params$max_iter <- 10
  setup$params$convergence_method <- "elbo"
  setup$params$tol <- 1e-3
  setup$params$refine <- FALSE
  result <- susie_workhorse(setup$data, setup$params)
  expect_s3_class(result, "susie")
  # Should complete without refinement
})

test_that("susie_workhorse skips refinement when no credible sets", {
  setup <- setup_individual_data(n = 100, p = 50, L = 5)
  setup$params$max_iter <- 2
  setup$params$convergence_method <- "elbo"
  setup$params$tol <- 1e-10
  setup$params$refine <- TRUE
  result <- susie_workhorse(setup$data, setup$params)
  expect_s3_class(result, "susie")
})

# =============================================================================
# TRACKING
# =============================================================================

test_that("susie_workhorse includes tracking when track_fit=TRUE", {
  setup <- setup_individual_data(n = 100, p = 50, L = 5)
  setup$params$max_iter <- 10
  setup$params$convergence_method <- "elbo"
  setup$params$tol <- 1e-3
  setup$params$track_fit <- TRUE
  result <- susie_workhorse(setup$data, setup$params)
  expect_true("trace" %in% names(result))
  expect_type(result$trace, "list")
})

test_that("susie_workhorse excludes tracking when track_fit=FALSE", {
  setup <- setup_individual_data(n = 100, p = 50, L = 5)
  setup$params$max_iter <- 10
  setup$params$convergence_method <- "elbo"
  setup$params$tol <- 1e-3
  setup$params$track_fit <- FALSE
  result <- susie_workhorse(setup$data, setup$params)
  expect_false("trace" %in% names(result))
})

# =============================================================================
# MODEL INITIALIZATION
# =============================================================================

test_that("susie_workhorse works without model_init", {
  setup <- setup_individual_data(n = 100, p = 50, L = 5)
  setup$params$max_iter <- 10
  setup$params$convergence_method <- "elbo"
  setup$params$tol <- 1e-3
  setup$params$model_init <- NULL
  result <- susie_workhorse(setup$data, setup$params)
  expect_s3_class(result, "susie")
})

# Warm-starting: the fit from one run is passed as model_init for a second
# run on data from a different seed.
test_that("susie_workhorse works with model_init", {
  setup <- setup_individual_data(n = 100, p = 50, L = 3)
  setup$params$max_iter <- 5
  setup$params$convergence_method <- "elbo"
  setup$params$tol <- 1e-3
  # Create an initial model
  model_init <- susie_workhorse(setup$data, setup$params)
  # Use it to initialize another run
  setup2 <- setup_individual_data(n = 100, p = 50, L = 3, seed = 43)
  setup2$params$max_iter <- 10
  setup2$params$convergence_method <- "elbo"
  setup2$params$tol <- 1e-3
  setup2$params$model_init <- model_init
  result <- susie_workhorse(setup2$data, setup2$params)
  expect_s3_class(result, "susie")
})

# =============================================================================
# CREDIBLE SETS
# =============================================================================

test_that("susie_workhorse computes credible sets", {
  setup <- setup_individual_data(n = 100, p = 50, L = 5)
  setup$params$max_iter <- 20
  setup$params$convergence_method <- "elbo"
  setup$params$tol <- 1e-3
  result <- susie_workhorse(setup$data, setup$params)
  expect_true("sets" %in% names(result))
  expect_type(result$sets, "list")
  expect_true("cs" %in% names(result$sets))
})

# =============================================================================
# FITTED VALUES
# =============================================================================

test_that("susie_workhorse computes fitted values", {
  setup <- setup_individual_data(n = 100, p = 50, L = 5)
  setup$params$max_iter <- 10
  setup$params$convergence_method <- "elbo"
  setup$params$tol <- 1e-3
  result <- susie_workhorse(setup$data, setup$params)
  expect_true("fitted" %in% names(result))
  expect_length(result$fitted, 100)
  expect_true(all(is.finite(result$fitted)))
})

test_that("susie_workhorse computes intercept when requested", {
  setup <- setup_individual_data(n = 100, p = 50, L = 5)
  setup$params$max_iter <- 10
  setup$params$convergence_method <- "elbo"
  setup$params$tol <- 1e-3
  setup$params$intercept <- TRUE
  result <- susie_workhorse(setup$data, setup$params)
  expect_true("intercept" %in% names(result))
  expect_true(is.finite(result$intercept))
})

# =============================================================================
# SIGNAL RECOVERY ON SIMULATED DATA
# =============================================================================

# End-to-end check: builds the data/params structures by hand (no setup
# helper) and verifies that the three planted causal variables get higher
# PIPs than the non-causal background.
test_that("susie_workhorse recovers true signal on simple simulated data", {
  # Generate data with known causal variables
  set.seed(123)
  n <- 200
  p <- 100
  k <- 3  # Number of causal variables
  X <- matrix(rnorm(n * p), n, p)
  beta <- rep(0, p)
  causal_idx <- c(10, 30, 50)
  beta[causal_idx] <- c(2, -2, 1.5)
  y <- drop(X %*% beta + rnorm(n, sd = 0.5))
  # Prepare data
  X <- set_X_attributes(X, center = TRUE, scale = TRUE)
  mean_y <- mean(y)
  y <- y - mean_y
  data <- structure(
    list(X = X, y = y, n = n, p = p, mean_y = mean_y),
    class = "individual"
  )
  params <- list(
    L = 5,
    intercept = TRUE,
    standardize = TRUE,
    estimate_residual_variance = TRUE,
    estimate_prior_variance = TRUE,
    estimate_prior_method = "optim",
    unmappable_effects = "none",
    use_NIG = FALSE,
    compute_univariate_zscore = TRUE,
    coverage = 0.95,
    min_abs_corr = 0.5,
    n_purity = 100,
    check_null_threshold = 0.1,
    scaled_prior_variance = 0.2,
    prior_weights = rep(1/p, p),
    null_weight = 0,
    residual_variance = NULL,
    track_fit = FALSE,
    prior_tol = 1e-9,
    max_iter = 100,
    convergence_method = "elbo",
    tol = 1e-3,
    refine = FALSE,
    model_init = NULL,
    verbose = FALSE
  )
  result <- susie_workhorse(data, params)
  # Check that causal variables have high PIPs
  expect_true(all(result$pip[causal_idx] > 0.1))
  # Check that most non-causal variables have low PIPs
  non_causal_idx <- setdiff(1:p, causal_idx)
  expect_true(mean(result$pip[non_causal_idx]) < mean(result$pip[causal_idx]))
})

# =============================================================================
# INTEGRATION WITH FULL PIPELINE
# =============================================================================

test_that("susie_workhorse produces output compatible with susie_get functions", {
  setup <- setup_individual_data(n = 100, p = 50, L = 5)
  setup$params$max_iter <- 20
  setup$params$convergence_method <- "elbo"
  setup$params$tol <- 1e-3
  result <- susie_workhorse(setup$data, setup$params)
  # Should be able to extract PIPs (already in result)
  expect_length(result$pip, 50)
  # Should have credible sets
  expect_true("sets" %in% names(result))
  # Should have all fields needed for coef() method
  expect_true(all(c("alpha", "mu", "intercept") %in% names(result)))
})

test_that("susie_workhorse output is a valid susie object", {
  setup <- setup_individual_data(n = 100, p = 50, L = 5)
  setup$params$max_iter <- 10
  setup$params$convergence_method <- "elbo"
  setup$params$tol <- 1e-3
  result <- susie_workhorse(setup$data, setup$params)
  # Check class
  expect_s3_class(result, "susie")
  # Check that we have all the core components for a susie object
  required_fields <- c(
    "alpha", "mu", "mu2", "V", "sigma2",
    "elbo", "niter", "converged",
    "pip", "sets", "fitted", "intercept",
    "lbf", "lbf_variable", "KL"
  )
  expect_true(all(required_fields %in% names(result)))
})



================================================
FILE: tests/testthat/test_trendfilter.R
================================================
context("Trend filtering")

# =============================================================================
# BASIC FUNCTIONALITY
# =============================================================================

test_that("susie_trendfilter returns susie object", {
  set.seed(1)
  mu <- c(rep(0, 20), rep(2, 20), rep(-1, 20))
  y <- mu + rnorm(60)
  result <- susie_trendfilter(y, order = 0, use_mad = FALSE)
  expect_s3_class(result, "susie")
  expect_type(result, "list")
  expect_true("alpha" %in% names(result))
  expect_true("mu" %in% names(result))
  expect_true("elbo" %in% names(result))
})

test_that("susie_trendfilter detects changepoints with order=0", {
  set.seed(2)
  # Create signal with clear changepoints
  mu <- c(rep(0, 25), rep(3, 25), rep(-2, 25), rep(1, 25))
  y <- mu + rnorm(100, sd = 0.3)
  result <- susie_trendfilter(y, order = 0, use_mad = FALSE)
  # Should have non-zero PIPs near changepoint locations (25, 50, 75)
  pip <- susie_get_pip(result)
  changepoint_regions <- c(23:27, 48:52, 73:77)
  expect_true(sum(pip[changepoint_regions]) > sum(pip[-changepoint_regions]))
})

test_that("susie_trendfilter fitted values track signal", {
  set.seed(3)
  mu <- c(rep(0, 20), rep(2, 20), rep(0, 20))
  y <- mu + rnorm(60, sd = 0.1)
  result <- susie_trendfilter(y, order = 0, use_mad = FALSE)
  fitted <- predict(result)
  # Fitted values should be closer to true signal than raw data
  expect_true(mean((fitted - mu)^2) < mean((y - mu)^2))
})

test_that("susie_trendfilter with no changepoints", {
  set.seed(4)
  # Constant signal
  y <- rep(5, 50) + rnorm(50, sd = 0.5)
  result <- susie_trendfilter(y, order = 0, use_mad = FALSE)
  # PIPs should be low everywhere (no clear changepoints)
  pip <- susie_get_pip(result)
  expect_true(max(pip) < 0.5)
})

# =============================================================================
# ORDER PARAMETER
# =============================================================================

test_that("susie_trendfilter with order=0 (changepoints)", {
  set.seed(5)
  mu <- c(rep(0, 20), rep(2, 20), rep(-1, 20))
  y <- mu + rnorm(60)
  # expect_error(..., NA) asserts that NO error is raised
  expect_error(
    result <- susie_trendfilter(y, order = 0, use_mad = FALSE),
    NA
  )
  expect_s3_class(result, "susie")
})

test_that("susie_trendfilter with order=1 warns", {
  set.seed(6)
  y <- seq(0, 1, length.out = 50) + rnorm(50, sd = 0.1)
  expect_message(
    result <- suppressWarnings(susie_trendfilter(y, order = 1, use_mad = FALSE)),
    "order > 0 is not recommended"
  )
  expect_s3_class(result, "susie")
})

test_that("susie_trendfilter with order=2 warns", {
  set.seed(7)
  y <- (seq(0, 1, length.out = 50))^2 + rnorm(50, sd = 0.1)
  expect_message(
    result <- suppressWarnings(susie_trendfilter(y, order = 2, use_mad = FALSE)),
    "order > 0 is not recommended"
  )
  expect_s3_class(result, "susie")
})

test_that("susie_trendfilter order=0 vs order=1 produce different results", {
  set.seed(8)
  # Linear trend
  y <- seq(0, 2, length.out = 50) + rnorm(50, sd = 0.1)
  result_0 <- susie_trendfilter(y, order = 0, use_mad = FALSE, max_iter = 10)
  result_1 <- suppressWarnings(
    susie_trendfilter(y, order = 1, use_mad = FALSE, max_iter = 10)
  )
  # Results should differ
  expect_false(all(abs(result_0$alpha - result_1$alpha) < 1e-10))
})

# =============================================================================
# USE_MAD PARAMETER
# =============================================================================
test_that("susie_trendfilter with use_mad=TRUE", {
  set.seed(9)
  mu <- c(rep(0, 20), rep(2, 20), rep(-1, 20))
  y <- mu + rnorm(60)
  # expect_error(..., NA) asserts that NO error is raised
  expect_error(
    result <- susie_trendfilter(y, order = 0, use_mad = TRUE),
    NA
  )
  expect_s3_class(result, "susie")
})

test_that("susie_trendfilter with use_mad=FALSE", {
  set.seed(10)
  mu <- c(rep(0, 20), rep(2, 20), rep(-1, 20))
  y <- mu + rnorm(60)
  expect_error(
    result <- susie_trendfilter(y, order = 0, use_mad = FALSE),
    NA
  )
  expect_s3_class(result, "susie")
})

test_that("susie_trendfilter use_mad=TRUE vs FALSE differ", {
  set.seed(11)
  mu <- c(rep(0, 20), rep(2, 20), rep(-1, 20))
  y <- mu + rnorm(60)
  result_mad <- susie_trendfilter(y, order = 0, use_mad = TRUE, max_iter = 5)
  result_no_mad <- susie_trendfilter(y, order = 0, use_mad = FALSE, max_iter = 5)
  # Results may differ due to initialization
  # Just verify both work
  expect_s3_class(result_mad, "susie")
  expect_s3_class(result_no_mad, "susie")
})

test_that("susie_trendfilter use_mad with model_init skips MAD", {
  set.seed(12)
  mu <- c(rep(0, 20), rep(2, 20))
  y <- mu + rnorm(40)
  # Create a simple init
  init <- susie_init_coef(c(20), c(2), 40)
  # With model_init, should skip MAD even if use_mad=TRUE
  result <- susie_trendfilter(y, order = 0, use_mad = TRUE, model_init = init, max_iter = 2)
  expect_s3_class(result, "susie")
})

test_that("susie_trendfilter rejects MAD=0 when use_mad=TRUE", {
  # Create constant data which will cause MAD = 0
  # All differences will be 0, so median(abs(diff(y))) = 0
  y <- rep(5, 50)
  expect_error(
    susie_trendfilter(y, order = 0, use_mad = TRUE),
    "Cannot use median absolute deviation \\(MAD\\) to initialize residual variance because MAD = 0 for the input data. Please set 'use_mad = FALSE'"
  )
})

# =============================================================================
# STANDARDIZE AND INTERCEPT OPTIONS
# =============================================================================

test_that("susie_trendfilter with standardize=TRUE", {
  set.seed(13)
  mu <- c(rep(0, 20), rep(2, 20), rep(-1, 20))
  y <- mu + rnorm(60)
  result <- susie_trendfilter(y, order = 0, standardize = TRUE, use_mad = FALSE)
  expect_s3_class(result, "susie")
  # alpha rows are posterior inclusion probabilities, so each entry is in [0,1]
  expect_true(all(result$alpha >= 0 & result$alpha <= 1))
})

test_that("susie_trendfilter with standardize=FALSE", {
  set.seed(14)
  mu <- c(rep(0, 20), rep(2, 20), rep(-1, 20))
  y <- mu + rnorm(60)
  result <- susie_trendfilter(y, order = 0, standardize = FALSE, use_mad = FALSE)
  expect_s3_class(result, "susie")
  expect_true(all(result$alpha >= 0 & result$alpha <= 1))
})

test_that("susie_trendfilter with intercept=TRUE", {
  set.seed(15)
  mu <- c(rep(0, 20), rep(2, 20), rep(-1, 20))
  y <- mu + rnorm(60) + 10 # Add offset
  result <- susie_trendfilter(y, order = 0, intercept = TRUE, use_mad = FALSE)
  expect_s3_class(result, "susie")
  expect_true(!is.na(result$intercept))
})

test_that("susie_trendfilter with intercept=FALSE", {
  set.seed(16)
  mu <- c(rep(0, 20), rep(2, 20), rep(-1, 20))
  y <- mu + rnorm(60)
  result <- susie_trendfilter(y, order = 0, intercept = FALSE, use_mad = FALSE)
  expect_s3_class(result, "susie")
  expect_equal(result$intercept, 0)
})

# =============================================================================
# PASS-THROUGH PARAMETERS
# =============================================================================

test_that("susie_trendfilter passes L parameter to susie", {
  set.seed(17)
  mu <- c(rep(0, 20), rep(2, 20), rep(-1, 20))
  y <- mu + rnorm(60)
  result <- susie_trendfilter(y, order = 0, L = 3, use_mad = FALSE)
  # L controls the number of single-effect components (rows of alpha)
  expect_equal(nrow(result$alpha), 3)
  expect_equal(length(result$V), 3)
})

test_that("susie_trendfilter passes max_iter parameter to susie", {
  set.seed(18)
  mu <- c(rep(0, 20), rep(2, 20), rep(-1, 20))
  y <- mu + rnorm(60)
  result <- susie_trendfilter(y, order = 0, max_iter = 5, use_mad = FALSE)
  expect_true(result$niter <= 5)
})

test_that("susie_trendfilter passes estimate_prior_variance to susie", {
  set.seed(19)
  mu <- c(rep(0, 20), rep(2, 20), rep(-1, 20))
  y <- mu + rnorm(60)
  result_estimate <- susie_trendfilter(y, order = 0, estimate_prior_variance = TRUE, use_mad = FALSE, max_iter = 3)
  result_fixed <- susie_trendfilter(y, order = 0, estimate_prior_variance = FALSE, use_mad = FALSE, max_iter = 3)
  # Both should work
  expect_s3_class(result_estimate, "susie")
  expect_s3_class(result_fixed, "susie")
})

test_that("susie_trendfilter passes null_weight to susie", {
  set.seed(20)
  mu <- c(rep(0, 30), rep(2, 30))
  y <- mu + rnorm(60)
  n <- length(y)
  result <- susie_trendfilter(y, order = 0, null_weight = 1/(n+1), use_mad = FALSE, max_iter = 3)
  expect_s3_class(result, "susie")
  # A non-zero null_weight should yield a recorded null_index
  expect_true(!is.null(result$null_index))
})

# =============================================================================
# INTEGRATION WITH SUSIE METHODS
# =============================================================================

test_that("susie_trendfilter output works with susie_get_cs", {
  set.seed(21)
  mu <- c(rep(0, 25), rep(3, 25), rep(-2, 25), rep(1, 25))
  y <- mu + rnorm(100, sd = 0.3)
  result <- susie_trendfilter(y, order = 0, use_mad = FALSE)
  cs <- susie_get_cs(result, coverage = 0.95)
  expect_type(cs, "list")
  expect_true("cs" %in% names(cs))
  expect_equal(cs$requested_coverage, 0.95)
})

test_that("susie_trendfilter output works with susie_get_pip", {
  set.seed(22)
  mu <- c(rep(0, 20), rep(2, 20), rep(-1, 20))
  y <- mu + rnorm(60)
  result <- susie_trendfilter(y, order = 0, use_mad = FALSE)
  pip <- susie_get_pip(result)
  expect_length(pip, length(y))
  expect_type(pip, "double")
  expect_true(all(pip >= 0 & pip <= 1))
})

test_that("susie_trendfilter output works with predict", {
  set.seed(23)
  mu <- c(rep(0, 20), rep(2, 20), rep(-1, 20))
  y <- mu + rnorm(60)
  result <- susie_trendfilter(y, order = 0, use_mad = FALSE)
  fitted <- predict(result)
  expect_length(fitted, length(y))
  expect_type(fitted, "double")
  expect_true(all(is.finite(fitted)))
})

test_that("susie_trendfilter output works with coef", {
  set.seed(24)
  mu <- c(rep(0, 20), rep(2, 20), rep(-1, 20))
  y <- mu + rnorm(60)
  result <- susie_trendfilter(y, order = 0, use_mad = FALSE)
  coefficients <- coef(result)
  # Should have length n+1 (intercept + n basis coefficients)
  expect_length(coefficients, length(y) + 1)
  expect_type(coefficients, "double")
})

test_that("susie_trendfilter output has sets field", {
  set.seed(25)
  mu <- c(rep(0, 25), rep(3, 25), rep(-2, 25), rep(1, 25))
  y <- mu + rnorm(100, sd = 0.3)
  result <- susie_trendfilter(y, order = 0, use_mad = FALSE)
  result$sets <- susie_get_cs(result, coverage = 0.95)
  # Verify sets structure
  expect_type(result$sets, "list")
  expect_true("cs" %in% names(result$sets))
  expect_true("coverage" %in% names(result$sets))
  expect_equal(result$sets$requested_coverage, 0.95)
})

# =============================================================================
# CHANGEPOINT DETECTION QUALITY
# =============================================================================

test_that("susie_trendfilter recovers true changepoints", {
  set.seed(26)
  # Simple changepoint problem
  mu <- c(rep(0, 30), rep(4, 30), rep(-2, 30))
  y <- mu + rnorm(90, sd = 0.5)
  result <- susie_trendfilter(y, order = 0, use_mad = FALSE)
  pip <- susie_get_pip(result)
  # Changepoints should be at positions 30 and 60
  # High PIP should be near these positions
  expect_true(pip[30] > 0.5 | pip[29] > 0.5 | pip[31] > 0.5)
  expect_true(pip[60] > 0.5 | pip[59] > 0.5 | pip[61] > 0.5)
})

test_that("susie_trendfilter handles multiple small changepoints", {
  set.seed(27)
  # Many small changes
  mu <- rep(c(0, 0.5), length.out = 60)
  y <- mu + rnorm(60, sd = 0.2)
  result <- susie_trendfilter(y, order = 0, use_mad = FALSE)
  expect_s3_class(result, "susie")
  expect_true(all(result$alpha >= 0 & result$alpha <= 1))
})
test_that("susie_trendfilter with noisy data", {
  set.seed(28)
  # Step signal buried in noise whose sd (2) exceeds the step size (2).
  truth <- rep(c(0, 2), times = c(30, 30))
  obs <- truth + rnorm(60, sd = 2) # High noise
  fit <- susie_trendfilter(obs, order = 0, use_mad = FALSE)
  # Even with this much noise the fit should still converge cleanly.
  expect_s3_class(fit, "susie")
  expect_true(fit$converged)
})

# =============================================================================
# EDGE CASES
# =============================================================================

test_that("susie_trendfilter with short time series", {
  set.seed(29)
  # Minimal series: one jump in six observations.
  obs <- c(0, 0, 0, 2, 2, 2)
  fit <- susie_trendfilter(obs, order = 0, use_mad = FALSE, max_iter = 3)
  expect_s3_class(fit, "susie")
})

test_that("susie_trendfilter with long time series", {
  set.seed(30)
  # 400-point staircase signal.
  truth <- rep(c(0, 1, 2, 0), each = 100)
  obs <- truth + rnorm(400, sd = 0.5)
  fit <- susie_trendfilter(obs, order = 0, use_mad = FALSE, max_iter = 20)
  expect_s3_class(fit, "susie")
  expect_length(predict(fit), 400)
})

test_that("susie_trendfilter with constant y errors", {
  set.seed(31)
  obs <- rep(5, 50)
  # Constant y has zero variance, should error
  expect_error(
    susie_trendfilter(obs, order = 0, use_mad = FALSE),
    "Residual variance sigma2 must be positive"
  )
})

test_that("susie_trendfilter with single changepoint at start", {
  set.seed(32)
  # Jump very early in the series (position 5).
  truth <- rep(c(0, 2), times = c(5, 45))
  obs <- truth + rnorm(50, sd = 0.3)
  fit <- susie_trendfilter(obs, order = 0, use_mad = FALSE)
  pips <- susie_get_pip(fit)
  # Should detect changepoint near position 5
  expect_true(any(pips[3:7] > 0.3))
})

test_that("susie_trendfilter with single changepoint at end", {
  set.seed(33)
  # Jump very late in the series (position 45).
  truth <- rep(c(0, 2), times = c(45, 5))
  obs <- truth + rnorm(50, sd = 0.3)
  fit <- susie_trendfilter(obs, order = 0, use_mad = FALSE)
  pips <- susie_get_pip(fit)
  # Should detect changepoint near position 45
  expect_true(any(pips[43:47] > 0.3))
})

# =============================================================================
# COMPARISON WITH MANUAL CONSTRUCTION
# =============================================================================
test_that("susie_trendfilter matches manual sparse matrix construction", {
  set.seed(34)
  # simulate_tf(order) supplies both the explicit basis matrix X and y
  with(simulate_tf(0), {
    # Manual approach with explicit X matrix
    result_manual <- susie(X, y, estimate_prior_variance = FALSE, standardize = TRUE, max_iter = 5)
    # Using susie_trendfilter
    result_tf <- susie_trendfilter(y, order = 0, estimate_prior_variance = FALSE, standardize = TRUE, use_mad = FALSE, max_iter = 5)
    # Should produce similar results
    expect_equal(result_tf$alpha, result_manual$alpha, tolerance = 1e-6)
    expect_equal(result_tf$mu, result_manual$mu, tolerance = 1e-6)
  })
})

test_that("susie_trendfilter order=1 matches manual construction", {
  set.seed(35)
  with(simulate_tf(1), {
    # Manual approach
    result_manual <- susie(X, y, estimate_prior_variance = FALSE, standardize = TRUE, max_iter = 5)
    # Using susie_trendfilter
    result_tf <- suppressWarnings(
      susie_trendfilter(y, order = 1, estimate_prior_variance = FALSE, standardize = TRUE, use_mad = FALSE, max_iter = 5)
    )
    # Should produce similar results
    expect_equal(result_tf$alpha, result_manual$alpha, tolerance = 1e-6)
    expect_equal(result_tf$mu, result_manual$mu, tolerance = 1e-6)
  })
})

test_that("susie_trendfilter order=2 matches manual construction", {
  set.seed(36)
  with(simulate_tf(2), {
    # Manual approach
    result_manual <- susie(X, y, estimate_prior_variance = FALSE, standardize = TRUE, max_iter = 5)
    # Using susie_trendfilter
    result_tf <- suppressWarnings(
      susie_trendfilter(y, order = 2, estimate_prior_variance = FALSE, standardize = TRUE, use_mad = FALSE, max_iter = 5)
    )
    # Should produce similar results
    expect_equal(result_tf$alpha, result_manual$alpha, tolerance = 1e-6)
    expect_equal(result_tf$mu, result_manual$mu, tolerance = 1e-6)
  })
})

# =============================================================================
# EXAMPLES FROM DOCUMENTATION
# =============================================================================

test_that("susie_trendfilter works with documentation example", {
  set.seed(1)
  mu <- c(rep(0, 50), rep(1, 50), rep(3, 50), rep(-2, 50), rep(0, 200))
  y <- mu + rnorm(400)
  s <- susie_trendfilter(y, max_iter = 100)
  expect_s3_class(s, "susie")
  expect_length(predict(s), 400)
  # Should be able to get credible sets
  cs <- susie_get_cs(s)
  expect_type(cs, "list")
})

================================================
FILE: tests/testthat/test_univariate_regression.R
================================================
context("Univariate regression")

# =============================================================================
# BASIC FUNCTIONALITY
# =============================================================================

test_that("univariate_regression returns correct structure", {
  base_data <- generate_base_data(n = 100, p = 10, k = 0, seed = 1)
  result <- univariate_regression(base_data$X, base_data$y)
  expect_type(result, "list")
  expect_named(result, c("betahat", "sebetahat"))
  expect_length(result$betahat, base_data$p)
  expect_length(result$sebetahat, base_data$p)
  expect_type(result$betahat, "double")
  expect_type(result$sebetahat, "double")
})

test_that("univariate_regression computes correct coefficients", {
  base_data <- generate_base_data(n = 100, p = 5, k = 0, seed = 2)
  beta_true <- c(1, -0.5, 0.8, 0, 0.3)
  y <- base_data$X %*% beta_true + rnorm(base_data$n, sd = 0.1)
  result <- univariate_regression(base_data$X, y, center = TRUE, scale = FALSE)
  # Each betahat should be close to the true beta
  for (i in 1:base_data$p) {
    expect_equal(result$betahat[i], beta_true[i], tolerance = 0.2)
  }
})

test_that("univariate_regression standard errors are positive", {
  base_data <- generate_base_data(n = 100, p = 10, k = 0, seed = 3)
  result <- univariate_regression(base_data$X, base_data$y)
  expect_true(all(result$sebetahat > 0))
})

test_that("univariate_regression matches manual lm calculation", {
  base_data <- generate_base_data(n = 50, p = 3, k = 0, seed = 4)
  result <- univariate_regression(base_data$X, base_data$y, center = TRUE, scale = FALSE)
  # Compare to manual lm for first column
  y_centered <- base_data$y - mean(base_data$y)
  X_centered <- scale(base_data$X, center = TRUE, scale = FALSE)
  manual_fit <- lm(y_centered ~ X_centered[, 1])
  expect_equal(result$betahat[1], unname(coef(manual_fit)[2]), tolerance = 1e-10)
  expect_equal(result$sebetahat[1], unname(summary(manual_fit)$coef[2, 2]), tolerance = 1e-10)
})

# =============================================================================
# CENTER AND SCALE OPTIONS
# =============================================================================

test_that("univariate_regression with center=TRUE, scale=FALSE", {
  base_data <- generate_base_data(n = 100, p = 5, k = 0, seed = 5)
  result <- univariate_regression(base_data$X, base_data$y, center = TRUE, scale = FALSE)
  expect_length(result$betahat, base_data$p)
  expect_length(result$sebetahat, base_data$p)
  expect_true(all(is.finite(result$betahat)))
  expect_true(all(is.finite(result$sebetahat)))
})

test_that("univariate_regression with center=TRUE, scale=TRUE", {
  base_data <- generate_base_data(n = 100, p = 5, k = 0, seed = 6)
  result <- univariate_regression(base_data$X, base_data$y, center = TRUE, scale = TRUE)
  expect_length(result$betahat, base_data$p)
  expect_length(result$sebetahat, base_data$p)
  expect_true(all(is.finite(result$betahat)))
  expect_true(all(is.finite(result$sebetahat)))
})

test_that("univariate_regression with center=FALSE, scale=FALSE", {
  base_data <- generate_base_data(n = 100, p = 5, k = 0, seed = 7)
  result <- univariate_regression(base_data$X, base_data$y, center = FALSE, scale = FALSE)
  expect_length(result$betahat, base_data$p)
  expect_length(result$sebetahat, base_data$p)
  expect_true(all(is.finite(result$betahat)))
  expect_true(all(is.finite(result$sebetahat)))
})

test_that("univariate_regression with center=FALSE, scale=TRUE", {
  base_data <- generate_base_data(n = 100, p = 5, k = 0, seed = 8)
  result <- univariate_regression(base_data$X, base_data$y, center = FALSE, scale = TRUE)
  expect_length(result$betahat, base_data$p)
  expect_length(result$sebetahat, base_data$p)
  expect_true(all(is.finite(result$betahat)))
  expect_true(all(is.finite(result$sebetahat)))
})

test_that("univariate_regression scaling affects coefficient magnitude", {
  base_data <- generate_base_data(n = 100, p = 5, k = 0, seed = 9)
  # Create X with different variances
  X_varied <- matrix(rnorm(base_data$n * base_data$p, sd = rep(c(1, 5, 10, 2, 3), each = base_data$n)), base_data$n, base_data$p)
  result_unscaled <- univariate_regression(X_varied, base_data$y, center = TRUE, scale = FALSE)
  result_scaled <- univariate_regression(X_varied, base_data$y, center = TRUE, scale = TRUE)
  # Coefficients should differ due to scaling
  expect_false(all(abs(result_unscaled$betahat - result_scaled$betahat) < 0.01))
})

# =============================================================================
# COVARIATES (Z PARAMETER)
# =============================================================================

test_that("univariate_regression with covariates Z", {
  base_data <- generate_base_data(n = 100, p = 5, k = 0, seed = 10)
  k <- 2
  Z <- matrix(rnorm(base_data$n * k), base_data$n, k)
  result <- univariate_regression(base_data$X, base_data$y, Z = Z, center = TRUE)
  expect_type(result, "list")
  expect_length(result$betahat, base_data$p)
  expect_length(result$sebetahat, base_data$p)
  expect_true(all(is.finite(result$betahat)))
  expect_true(all(is.finite(result$sebetahat)))
})

test_that("univariate_regression with Z adjusts for confounders", {
  base_data <- generate_base_data(n = 200, p = 5, k = 0, seed = 11)
  # Create confounder
  Z <- matrix(rnorm(base_data$n), base_data$n, 1)
  # X correlated with Z
  X_confounded <- base_data$X + Z %*% matrix(rnorm(base_data$p), 1, base_data$p)
  # y depends only on Z, not X
  y_confounded <- 2 * Z[, 1] + rnorm(base_data$n, sd = 0.1)
  result_no_Z <- univariate_regression(X_confounded, y_confounded, Z = NULL, center = TRUE)
  result_with_Z <- univariate_regression(X_confounded, y_confounded, Z = Z, center = TRUE)
  # Without Z, X appears associated with y
  # With Z adjustment, association should be weaker
  expect_true(mean(abs(result_with_Z$betahat)) < mean(abs(result_no_Z$betahat)))
})

test_that("univariate_regression with Z and return_residuals=TRUE", {
  base_data <- generate_base_data(n = 100, p = 5, k = 0, seed = 12)
  k <- 2
  Z <- matrix(rnorm(base_data$n * k), base_data$n, k)
  result <- univariate_regression(base_data$X, base_data$y, Z = Z, return_residuals = TRUE)
  expect_type(result, "list")
  expect_named(result, c("betahat", "sebetahat", "residuals"))
  expect_length(result$residuals, base_data$n)
  expect_type(result$residuals, "double")
})

test_that("univariate_regression return_residuals=TRUE without Z omits residuals", {
  base_data <- generate_base_data(n = 100, p = 5, k = 0, seed = 13)
  result <- univariate_regression(base_data$X, base_data$y, Z = NULL, return_residuals = TRUE)
  expect_named(result, c("betahat", "sebetahat"))
  expect_false("residuals" %in% names(result))
})

test_that("univariate_regression residuals from Z are centered", {
  base_data <- generate_base_data(n = 100, p = 5, k = 0, seed = 14)
  k <- 2
  Z <- matrix(rnorm(base_data$n * k), base_data$n, k)
  result <- univariate_regression(base_data$X, base_data$y, Z = Z, return_residuals = TRUE, center = TRUE)
  # Residuals should be approximately centered
  expect_equal(mean(result$residuals), 0, tolerance = 1e-10)
})

# =============================================================================
# NA HANDLING
# =============================================================================

test_that("univariate_regression handles NA values in y", {
  base_data <- generate_base_data(n = 100, p = 5, k = 0, seed = 15)
  base_data$y[c(5, 20, 35)] <- NA
  result <- univariate_regression(base_data$X, base_data$y)
  expect_length(result$betahat, base_data$p)
  expect_length(result$sebetahat, base_data$p)
  expect_true(all(is.finite(result$betahat)))
  expect_true(all(is.finite(result$sebetahat)))
})

test_that("univariate_regression removes corresponding X rows when y has NA", {
  base_data <- generate_base_data(n = 100, p = 5, k = 0, seed = 16)
  beta_true <- rep(1, base_data$p)
  y_with_signal <- base_data$X %*% beta_true + rnorm(base_data$n, sd = 0.1)
  # Add NAs
  na_idx <- c(10, 20, 30)
  y_with_signal[na_idx] <- NA
  result <- univariate_regression(base_data$X, y_with_signal, center = TRUE)
  # Should still produce finite results (NA removal worked)
  expect_true(all(is.finite(result$betahat)))
  expect_true(all(is.finite(result$sebetahat)))
  expect_length(result$betahat, base_data$p)
})

# =============================================================================
# EDGE CASES
# =============================================================================

test_that("univariate_regression with zero-variance column", {
  base_data <- generate_base_data(n = 100, p = 5, k = 0, seed = 17)
  base_data$X[, 3] <- 5 # Constant column
  # Should produce a warning message for the constant column
  expect_message(
    result <- univariate_regression(base_data$X, base_data$y, center = TRUE, scale = FALSE),
    "WARNING:.*Column 3 has zero variance"
  )
  # Constant column becomes zero after centering
  expect_equal(result$betahat[3], 0)
  expect_equal(result$sebetahat[3], 0)
})

test_that("univariate_regression with perfect predictor", {
  base_data <- generate_base_data(n = 100, p = 5, k = 0, seed = 18)
  # Make y perfectly predicted by first column
  y_perfect <- 3 * base_data$X[, 1] + mean(base_data$X[, 1])
  result <- univariate_regression(base_data$X, y_perfect, center = TRUE, scale = FALSE)
  # First coefficient should be exactly 3, SE should be very small
  expect_equal(result$betahat[1], 3, tolerance = 1e-10)
  expect_true(result$sebetahat[1] < 1e-10)
})

test_that("univariate_regression with single column X", {
  base_data <- generate_base_data(n = 100, p = 1, k = 0, seed = 19)
  result <- univariate_regression(base_data$X, base_data$y)
  expect_length(result$betahat, 1)
  expect_length(result$sebetahat, 1)
  expect_true(is.finite(result$betahat[1]))
  expect_true(is.finite(result$sebetahat[1]))
})

test_that("univariate_regression with very small sample size", {
  base_data <- generate_base_data(n = 5, p = 3, k = 0, seed = 20)
  result <- univariate_regression(base_data$X, base_data$y)
  expect_length(result$betahat, base_data$p)
  expect_length(result$sebetahat, base_data$p)
})

# =============================================================================
# Z-SCORES
# =============================================================================

test_that("univariate_regression enables z-score calculation", {
  base_data <- generate_base_data(n = 100, p = 10, k = 0, seed = 21)
  beta_true <- c(rep(1, 3), rep(0, 7))
  y_signal <- base_data$X %*% beta_true + rnorm(base_data$n)
  result <- univariate_regression(base_data$X, y_signal)
  # Calculate z-scores
  z <- result$betahat / result$sebetahat
  expect_length(z, base_data$p)
  expect_type(z, "double")
  # Causal variables should have larger |z|
  expect_true(mean(abs(z[1:3])) > mean(abs(z[4:10])))
})

# =============================================================================
# METHOD COMPARISON: LMFIT VS SUMSTATS
# =============================================================================

test_that("univariate_regression methods lmfit and sumstats agree", {
  base_data <- generate_base_data(n = 100, p = 10, k = 0, seed = 22)
  res1 <- univariate_regression(base_data$X, base_data$y, method = "lmfit")
  res2 <- univariate_regression(base_data$X, base_data$y, method = "sumstats")
  expect_equal(res1$betahat, res2$betahat, tolerance = 1e-8)
  expect_equal(res1$sebetahat, res2$sebetahat, tolerance = 1e-8)
})

test_that("lmfit and sumstats agree with center=TRUE, scale=FALSE", {
  base_data <- generate_base_data(n = 100, p = 10, k = 0, seed = 23)
  res1 <- univariate_regression(base_data$X, base_data$y, center = TRUE, scale = FALSE, method = "lmfit")
  res2 <- univariate_regression(base_data$X, base_data$y, center = TRUE, scale = FALSE, method = "sumstats")
  expect_equal(res1$betahat, res2$betahat, tolerance = 1e-8)
  expect_equal(res1$sebetahat, res2$sebetahat, tolerance = 1e-8)
})

test_that("lmfit and sumstats agree with center=TRUE, scale=TRUE", {
  base_data <- generate_base_data(n = 100, p = 10, k = 0, seed = 24)
  res1 <- univariate_regression(base_data$X, base_data$y, center = TRUE, scale = TRUE, method = "lmfit")
  res2 <- univariate_regression(base_data$X, base_data$y, center = TRUE, scale = TRUE, method = "sumstats")
  expect_equal(res1$betahat, res2$betahat, tolerance = 1e-8)
  expect_equal(res1$sebetahat, res2$sebetahat, tolerance = 1e-8)
})

test_that("lmfit and sumstats agree with center=FALSE, scale=FALSE", {
  base_data <- generate_base_data(n = 100, p = 10, k = 0, seed = 25)
  res1 <- univariate_regression(base_data$X, base_data$y, center = FALSE, scale = FALSE, method = "lmfit")
  res2 <- univariate_regression(base_data$X, base_data$y, center = FALSE, scale = FALSE, method = "sumstats")
  expect_equal(res1$betahat, res2$betahat, tolerance = 1e-8)
  expect_equal(res1$sebetahat, res2$sebetahat, tolerance = 1e-8)
})

test_that("lmfit and sumstats agree with center=FALSE, scale=TRUE", {
  base_data <- generate_base_data(n = 100, p = 10, k = 0, seed = 26)
  res1 <- univariate_regression(base_data$X, base_data$y, center = FALSE, scale = TRUE, method = "lmfit")
  res2 <- univariate_regression(base_data$X, base_data$y, center = FALSE, scale = TRUE, method = "sumstats")
  expect_equal(res1$betahat, res2$betahat, tolerance = 1e-8)
  expect_equal(res1$sebetahat, res2$sebetahat, tolerance = 1e-8)
})

test_that("lmfit and sumstats agree with covariates Z", {
  base_data <- generate_base_data(n = 100, p = 10, k = 0, seed = 27)
  k <- 3
  Z <- matrix(rnorm(base_data$n * k), base_data$n, k)
  res1 <- univariate_regression(base_data$X, base_data$y, Z = Z, center = TRUE, method = "lmfit")
  res2 <- univariate_regression(base_data$X, base_data$y, Z = Z, center = TRUE, method = "sumstats")
  expect_equal(res1$betahat, res2$betahat, tolerance = 1e-8)
  expect_equal(res1$sebetahat, res2$sebetahat, tolerance = 1e-8)
})

test_that("lmfit and sumstats agree with NA values in y", {
  base_data <- generate_base_data(n = 100, p = 10, k = 0, seed = 28)
  base_data$y[c(5, 20, 35)] <- NA
  res1 <- univariate_regression(base_data$X, base_data$y, method = "lmfit")
  res2 <- univariate_regression(base_data$X, base_data$y, method = "sumstats")
  expect_equal(res1$betahat, res2$betahat, tolerance = 1e-8)
  expect_equal(res1$sebetahat, res2$sebetahat, tolerance = 1e-8)
})

test_that("lmfit and sumstats agree with zero-variance column", {
  base_data <- generate_base_data(n = 100, p = 10, k = 0, seed = 29)
  base_data$X[, 5] <- 3 # Constant column
  # Both methods should produce warning messages
  expect_message(
    res1 <- univariate_regression(base_data$X, base_data$y, center = TRUE, scale = FALSE, method = "lmfit"),
    "WARNING:.*Column 5 has zero variance"
  )
  expect_message(
    res2 <- univariate_regression(base_data$X, base_data$y, center = TRUE, scale = FALSE, method = "sumstats"),
    "WARNING:.*Column 5 has zero variance"
  )
  expect_equal(res1$betahat, res2$betahat, tolerance = 1e-8)
  expect_equal(res1$sebetahat, res2$sebetahat, tolerance = 1e-8)
})

test_that("lmfit and sumstats agree with single column X", {
  base_data <- generate_base_data(n = 100, p = 1, k = 0, seed = 30)
  res1 <- univariate_regression(base_data$X, base_data$y, method = "lmfit")
  res2 <- univariate_regression(base_data$X, base_data$y, method = "sumstats")
  expect_equal(res1$betahat, res2$betahat, tolerance = 1e-8)
  expect_equal(res1$sebetahat, res2$sebetahat, tolerance = 1e-8)
})

test_that("lmfit and sumstats agree with large dataset", {
  base_data <- generate_base_data(n = 500, p = 5000, k = 0, seed = 31)
  res1 <- univariate_regression(base_data$X, base_data$y, center = TRUE, scale = TRUE, method = "lmfit")
  res2 <- univariate_regression(base_data$X, base_data$y, center = TRUE, scale = TRUE, method = "sumstats")
  expect_equal(res1$betahat, res2$betahat, tolerance = 1e-8)
  expect_equal(res1$sebetahat, res2$sebetahat, tolerance = 1e-8)
})

# =============================================================================
# =============================================================================
# COMPARISON WITH SIMPLE LM
# =============================================================================

test_that("univariate_regression agrees with lm for each column", {
  base_data <- generate_base_data(n = 50, p = 5, k = 0, seed = 32)
  result <- univariate_regression(base_data$X, base_data$y, center = TRUE, scale = FALSE)
  # Prepare centered data
  y_c <- base_data$y - mean(base_data$y)
  X_c <- scale(base_data$X, center = TRUE, scale = FALSE)
  # Compare each column
  for (i in 1:base_data$p) {
    lm_fit <- lm(y_c ~ X_c[, i])
    lm_coef <- unname(coef(summary(lm_fit))[2, ])
    expect_equal(result$betahat[i], lm_coef[1], tolerance = 1e-10)
    expect_equal(result$sebetahat[i], lm_coef[2], tolerance = 1e-10)
  }
})

# =============================================================================
# FALLBACK MECHANISM
# =============================================================================

test_that("univariate_regression fallback works when fast method fails", {
  base_data <- generate_base_data(n = 100, p = 5, k = 0, seed = 33)
  # Normal execution should work
  result <- univariate_regression(base_data$X, base_data$y)
  expect_length(result$betahat, base_data$p)
  expect_true(all(is.finite(result$betahat)))
  expect_true(all(is.finite(result$sebetahat)))
})

test_that("univariate_regression handles nearly singular design matrix", {
  base_data <- generate_base_data(n = 100, p = 5, k = 0, seed = 34)
  # Make two columns nearly identical
  base_data$X[, 2] <- base_data$X[, 1] + rnorm(base_data$n, sd = 1e-10)
  # Should still produce output (possibly via fallback)
  result <- univariate_regression(base_data$X, base_data$y, center = TRUE)
  expect_length(result$betahat, base_data$p)
  expect_length(result$sebetahat, base_data$p)
})

# =============================================================================
# INTEGRATION TESTS
# =============================================================================

test_that("univariate_regression output usable for RSS methods", {
  base_data <- generate_base_data(n = 200, p = 100, k = 0, seed = 35)
  beta_true <- rep(0, base_data$p)
  beta_true[1:5] <- rnorm(5)
  y_causal <- base_data$X %*% beta_true + rnorm(base_data$n)
  result <- univariate_regression(base_data$X, y_causal)
  # Should be able to compute z-scores
  z <- result$betahat / result$sebetahat
  # Should be able to compute correlation matrix
  R <- cor(base_data$X)
  # Should be usable with estimate_s_rss
  # expect_error(..., NA) asserts that NO error is raised
  expect_error(
    s <- estimate_s_rss(z, R, n = base_data$n),
    NA
  )
})

test_that("univariate_regression with center and scale matches susie preprocessing", {
  base_data <- generate_base_data(n = 100, p = 50, k = 0, seed = 36)
  # This should match what susie does internally for univariate regression
  result <- univariate_regression(base_data$X, base_data$y, center = TRUE, scale = TRUE)
  expect_length(result$betahat, base_data$p)
  expect_true(all(is.finite(result$betahat)))
  expect_true(all(is.finite(result$sebetahat)))
})

# =============================================================================
# CALC_Z FUNCTION
# =============================================================================

test_that("calc_z returns correct z-scores for single outcome (vector Y)", {
  base_data <- generate_base_data(n = 100, p = 10, k = 0, seed = 37)
  # Compute z-scores using calc_z
  z <- susieR:::calc_z(base_data$X, base_data$y, center = FALSE, scale = FALSE)
  # Manually compute z-scores
  result <- univariate_regression(base_data$X, base_data$y, center = FALSE, scale = FALSE)
  z_manual <- result$betahat / result$sebetahat
  expect_equal(z, z_manual)
  expect_length(z, base_data$p)
  expect_type(z, "double")
})

test_that("calc_z returns correct z-scores for multiple outcomes (matrix Y)", {
  set.seed(38)
  n <- 100
  p <- 10
  m <- 3 # Number of outcomes
  X <- matrix(rnorm(n * p), n, p)
  Y <- matrix(rnorm(n * m), n, m)
  # Compute z-scores using calc_z
  z_matrix <- susieR:::calc_z(X, Y, center = FALSE, scale = FALSE)
  # Should return a matrix with p rows and m columns
  expect_true(is.matrix(z_matrix))
  expect_equal(nrow(z_matrix), p)
  expect_equal(ncol(z_matrix), m)
  # Each column should match manual calculation for that outcome
  for (i in 1:m) {
    result <- univariate_regression(X, Y[, i], center = FALSE, scale = FALSE)
    z_manual <- result$betahat / result$sebetahat
    expect_equal(z_matrix[, i], z_manual)
  }
})

test_that("calc_z with center=TRUE centers data before computing z-scores", {
  set.seed(39)
  n <- 100
  p <- 10
  X <- matrix(rnorm(n * p, mean = 5, sd = 2), n, p)
  y <- rnorm(n, mean = 10, sd = 3)
  # Compute z-scores with centering
  z_centered <- susieR:::calc_z(X, y, center = TRUE, scale = FALSE)
  # Manually compute with centering
  result <- univariate_regression(X, y, center = TRUE, scale = FALSE)
  z_manual <- result$betahat / result$sebetahat
  expect_equal(z_centered, z_manual)
  expect_length(z_centered, p)
})

test_that("calc_z with scale=TRUE scales data before computing z-scores", {
  set.seed(40)
  n <- 100
  p <- 10
  X <- matrix(rnorm(n * p, sd = c(1, 5, 10, 2, 3, 1, 4, 8, 1, 2)), n, p)
  y <- rnorm(n, sd = 5)
  # Compute z-scores with scaling
  z_scaled <- susieR:::calc_z(X, y, center = FALSE, scale = TRUE)
  # Manually compute with scaling
  result <- univariate_regression(X, y, center = FALSE, scale = TRUE)
  z_manual <- result$betahat / result$sebetahat
  expect_equal(z_scaled, z_manual)
  expect_length(z_scaled, p)
})

test_that("calc_z with center=TRUE and scale=TRUE", {
  set.seed(41)
  n <- 100
  p <- 10
  X <- matrix(rnorm(n * p, mean = 3, sd = c(1, 5, 10, 2, 3, 1, 4, 8, 1, 2)), n, p)
  y <- rnorm(n, mean = 7, sd = 5)
  # Compute z-scores with both centering and scaling
  z_both <- susieR:::calc_z(X, y, center = TRUE, scale = TRUE)
  # Manually compute with both
  result <- univariate_regression(X, y, center = TRUE, scale = TRUE)
  z_manual <- result$betahat / result$sebetahat
  expect_equal(z_both, z_manual)
  expect_length(z_both, p)
})

test_that("calc_z handles matrix Y with different centering/scaling", {
  set.seed(42)
  n <- 100
  p
<- 8 m <- 4 # Create data with varying means and scales to ensure differences X <- matrix(rnorm(n * p, mean = rep(c(0, 5, -3, 2), each = n * 2)), n, p) Y <- matrix(rnorm(n * m, mean = rep(c(0, 10, -5, 3), each = n)), n, m) # Add varying scales for (i in 1:p) { X[, i] <- X[, i] * (i %% 3 + 1) } # Test all combinations z1 <- susieR:::calc_z(X, Y, center = FALSE, scale = FALSE) z2 <- susieR:::calc_z(X, Y, center = TRUE, scale = FALSE) z3 <- susieR:::calc_z(X, Y, center = FALSE, scale = TRUE) z4 <- susieR:::calc_z(X, Y, center = TRUE, scale = TRUE) # All should be matrices with correct dimensions expect_equal(dim(z1), c(p, m)) expect_equal(dim(z2), c(p, m)) expect_equal(dim(z3), c(p, m)) expect_equal(dim(z4), c(p, m)) # All should be finite expect_true(all(is.finite(z1))) expect_true(all(is.finite(z2))) expect_true(all(is.finite(z3))) expect_true(all(is.finite(z4))) }) test_that("calc_z matrix Y branch is tested (is.null(dim(Y)) = FALSE)", { set.seed(43) n <- 50 p <- 5 m <- 2 X <- matrix(rnorm(n * p), n, p) Y <- matrix(rnorm(n * m), n, m) # Y is a matrix, so dim(Y) is not NULL expect_false(is.null(dim(Y))) # This should execute the matrix branch z_matrix <- susieR:::calc_z(X, Y, center = TRUE, scale = FALSE) # Verify it's a matrix expect_true(is.matrix(z_matrix)) expect_equal(ncol(z_matrix), m) }) test_that("calc_z vector Y branch is tested (is.null(dim(Y)) = TRUE)", { set.seed(44) n <- 50 p <- 5 X <- matrix(rnorm(n * p), n, p) y <- rnorm(n) # y is a vector, so dim(y) is NULL expect_true(is.null(dim(y))) # This should execute the vector branch z_vector <- susieR:::calc_z(X, y, center = TRUE, scale = FALSE) # Verify it's a vector expect_false(is.matrix(z_vector)) expect_length(z_vector, p) }) ================================================ FILE: tests/testthat.R ================================================ library(testthat) library(susieR) test_check("susieR") ================================================ FILE: vignettes/announcements.Rmd 
================================================ --- title: "News and Updates" output: rmarkdown::html_vignette: toc: true toc_depth: 3 vignette: > %\VignetteIndexEntry{News and Updates} %\VignetteEngine{knitr::rmarkdown} %\VignetteEncoding{UTF-8} --- ```{r, include = FALSE} knitr::opts_chunk$set( collapse = TRUE, comment = "#>" ) ``` # Release notes ## Version 2.0.0 - Major Release *Release date: 2026-03-29* ### Release Overview This major release introduces **`susieR` 2.0**, a complete architectural redesign that addresses the code duplication and fragmented architecture of the original SuSiE implementation as a result of years of continued development, while adding new features and various performance optimizations, all while maintaining backward compatibility. `susieR` 2.0 eliminates the duplicative architecture of the original implementation through a unified framework built on modular design principles. The user-facing interface remains largely unchanged, but the implementation now uses generic functions with data-type specific backends through R's S3 dispatch system. A key design insight is that most SuSiE extensions reduce to customizations in either Bayes factor computation (per single-effect regression) or residual variance estimation (on the model objective), and the S3 dispatch architecture exploits this separation so that each extension is a local change without modifying the core IBSS algorithm. This architecture has enabled the integration of multiple SuSiE extensions, and serves as the backbone for the refactored mvsusieR package for multi-trait fine-mapping ([Zou et al. 2026](https://doi.org/10.1038/s41588-025-02486-7)). Beyond architectural improvements, this release introduces new features including unmappable effects modeling, stochastic LD reference with mixture panel support, enhanced computational speed, and improved IBSS refinement procedures. 
### New Features * **SuSiE-ash Model**: New adaptive shrinkage framework ([Stephens 2017](https://doi.org/10.1093/biostatistics/kxw041)) for unmappable effects, extending SuSiE to handle moderately strong but unmappable effects. SuSiE-ash achieves calibration intermediate between standard SuSiE and the more conservative SuSiE-inf under polygenic architectures while maintaining comparable power. * **SuSiE-inf Integration**: Implementation of SuSiE-inf ([Cui et al. 2024](https://www.nature.com/articles/s41588-023-01597-3)), which models infinitesimal effects alongside sparse causal signals to improve fine-mapping calibration when genetic architecture includes polygenic backgrounds. * **Servin-Stephens Prior Integration**: New prior option ([Servin and Stephens, 2007](https://doi.org/10.1371/journal.pgen.0030114)) on residual variance estimates in single effect regression (SER) to improve credible set coverage and calibration, particularly useful for small sample studies ([Denault et al. 2025](https://www.biorxiv.org/content/10.1101/2025.05.16.654543v1)). Implemented for both individual-level and summary statistics backends. * **Stochastic LD Reference**: Support for using genotype matrices directly, including stochastic genotypes in place of LD correlation matrices in summary statistics models (Sun et al., in preparation), with linear algebra optimizations that cache decompositions and exploit the LD structure for speedup. * **Mixture of LD Reference Panels**: Support for combining multiple LD reference panels with adaptive weight optimization within the regularized LD (RSS-lambda) model framework (Sun et al., in preparation), enabling more robust fine-mapping with diverse or mismatched reference populations. * **`mvsusieR` Backbone**: The S3 dispatch architecture serves as the shared backbone for mvsusieR, enabling our multi-trait fine-mapping methods to build directly on the susieR 2.0 framework with their own S3 dispatch class. 
### Enhancements * **Performance improvements for RSS model**: algebraic optimizations improve RSS models, with further gains on large genomic regions when reference genotype matrices replace LD correlation matrices. * **Convergence Criteria**: PIP-based convergence option alongside traditional ELBO convergence, particularly useful for methods where ELBO computation is expensive. * **Residual Variance Estimation**: Method of Moments option alongside Maximum Likelihood for improved stability. * **Block Coordinate Ascent Refinement**: Improved refinement procedure that escapes local optima through alternative initializations and enables residual variance estimation with missing data in multi-trait fine-mapping via `mvsusieR`. * **Verbose Diagnostics**: Detailed diagnostic output for monitoring model fitting behavior. * **Attainable Coverage**: Post-hoc credible set coverage adjustment as a rough alternative when LD matrices are unavailable for purity filtering. * **Unit Test Coverage**: Comprehensive unit tests covering 100% of code. ================================================ FILE: vignettes/finemapping.Rmd ================================================ --- title: "Fine-mapping example" author: "Gao Wang" date: "`r Sys.Date()`" output: rmarkdown::html_vignette vignette: > %\VignetteIndexEntry{Fine-mapping example} %\VignetteEngine{knitr::rmarkdown} %\VignetteEncoding{UTF-8} --- ```{r setup, include=FALSE} knitr::opts_chunk$set(collapse = TRUE,comment = "#",fig.width = 5, fig.height = 3,fig.align = "center", fig.cap = " ",dpi = 120) ``` This vignette demonstrates `susieR` in the context of genetic fine-mapping. We use simulated data of expression level of a gene ($y$) in $N \approx 600$ individuals. We want to identify with the genotype matrix $X_{N\times P}$ ($P=1001$) the genetic variables that cause changes in expression level. The data set is simulated to have exactly 3 non-zero effects. 
```{r} library(susieR) set.seed(1) ``` ## The data-set ```{r} data(N3finemapping) attach(N3finemapping) ``` The loaded dataset contains regression data $X$ and $y$, along with some other relevant properties in the context of genetic studies. It also contains the "true" regression coefficients the data is simulated from. Notice that we've simulated 2 sets of $Y$ as 2 simulation replicates. Here we'll focus on the first data-set. ```{r} dim(Y) ``` Here are the 3 "true" signals in the first data-set: ```{r} b <- true_coef[,1] plot(b, pch=16, ylab='effect size') ``` ```{r} which(b != 0) ``` So the underlying causal variables are 403, 653 and 773. ## Simple regression summary statistics The `univariate_regression` function can be used to compute summary statistics by fitting univariate simple regression variable by variable. The results are $\hat{\beta}$ and $SE(\hat{\beta})$ from which z-scores can be derived. Again we focus only on results from the first data-set: ```{r} sumstats <- univariate_regression(X, Y[,1]) z_scores <- sumstats$betahat / sumstats$sebetahat susie_plot(z_scores, y = "z", b=b) ``` ## Fine-mapping with `susieR` For starters, we assume there are at most 10 causal variables, i.e., set `L = 10`, although SuSiE is robust to the choice of `L`. The `susie` function call is: ```{r} fitted <- susie(X, Y[,1], L = 10, verbose = TRUE) ``` ### Credible sets By default, we output 95% credible sets: ```{r} print(fitted$sets) ``` The 3 causal signals have been captured by the 3 CS reported here. The 3rd CS contains many variables, including the true causal variable `403`. The minimum absolute correlation is 0.86. If we instead use 90% coverage for credible sets, we still capture the 3 signals, but "purity" of the 3rd CS is now 0.91 and size of the CS is also a bit smaller. 
```{r} sets <- susie_get_cs(fitted, X = X, coverage = 0.9, min_abs_corr = 0.1) ``` ```{r} print(sets) ``` ### Posterior inclusion probabilities Previously we've determined that summing over 3 single effect regression models is appropriate for our application. Here we summarize the variable selection results by posterior inclusion probability (PIP): ```{r} susie_plot(fitted, y="PIP", b=b) ``` The true causal variables are colored red. The 95% CS identified are circled in different colors. Of interest is the cluster around position 400. The true signal is 403 but apparently it does not have the highest PIP. To compare ranking of PIP and original z-score in that CS: ```{r} i <- fitted$sets$cs[[3]] z3 <- cbind(i,z_scores[i],fitted$pip[i]) colnames(z3) <- c('position', 'z-score', 'PIP') z3[order(z3[,2], decreasing = TRUE),] ``` ### Choice of priors Notice that by default SuSiE estimates prior effect size from data. For fine-mapping applications, however, we sometimes have knowledge of SuSiE prior effect size since it is parameterized as percentage of variance explained (PVE) by a non-zero effect, which, in the context of fine-mapping, is related to per-SNP heritability. It is possible to use `scaled_prior_variance` to specify this PVE and explicitly set `estimate_prior_variance=FALSE` to fix the prior effect to the given value. In this data-set, SuSiE is robust to choice of priors. Here we set PVE to 0.2, and compare with previous results: ```{r} fitted = susie(X, Y[,1], L = 10, estimate_residual_variance = TRUE, estimate_prior_variance = FALSE, scaled_prior_variance = 0.2) susie_plot(fitted, y='PIP', b=b) ``` which largely remains unchanged. ### A note on covariate adjustment To include covariate `Z` in SuSiE, one approach is to regress it out from both `y` and `X`, and then run SuSiE on the residuals. 
The code below illustrates the procedure: ```{r, eval=FALSE} remove.covariate.effects <- function (X, Z, y) { # include the intercept term if (any(Z[,1]!=1)) Z = cbind(1, Z) A <- forceSymmetric(crossprod(Z)) SZy <- as.vector(solve(A,c(y %*% Z))) SZX <- as.matrix(solve(A,t(Z) %*% X)) y <- y - c(Z %*% SZy) X <- X - Z %*% SZX return(list(X = X,y = y,SZy = SZy,SZX = SZX)) } out = remove.covariate.effects(X, Z, Y[,1]) fitted_adjusted = susie(out$X, out$y, L = 10) ``` Note that the covariates `Z` should have a column of ones as the first column. If not, the above function `remove.covariate.effects` will add such a column to `Z` before regressing it out. Data will be centered as a result. Also the scale of data is changed after regressing out `Z`. This introduces some subtleties in terms of interpreting the results. For this reason, we provide covariate adjustment procedure as a tip in the documentation and not part of `susieR::susie()` function. Cautions should be taken when applying this procedure and interpreting the result from it. ## Sufficient statistics: `compute_suff_stat` and `susie_ss` When individual-level data $(X, y)$ are available and the sample size $N$ is much larger than the number of variables $P$, calling `susie(X, y)` directly is wasteful: each IBSS iteration touches `X` again, and when many response vectors are fit against the same `X` (for example, many proteins or genes on a shared locus), $X'X$ is rebuilt every time. The sufficient statistics $(X'X, X'y, y'y, n)$ capture everything `susie` needs; once they are computed, `susie_ss` can be called directly and $X'X$ reused across response vectors. 
The function `compute_suff_stat` produces these sufficient statistics from $(X, y)$: ```{r} ss <- compute_suff_stat(X, Y[,1]) str(ss) ``` They pass directly to `susie_ss`: ```{r} fitted_ss <- susie_ss(XtX = ss$XtX, Xty = ss$Xty, yty = ss$yty, n = ss$n, X_colmeans = ss$X_colmeans, y_mean = ss$y_mean, L = 10, estimate_residual_variance = TRUE) ``` With matched hyperparameters, `susie_ss(...)` is numerically equivalent to running `susie` on $(X, y)$ directly: ```{r} fitted <- susie(X, Y[,1], L = 10) all.equal(fitted$pip, fitted_ss$pip) ``` For a second response vector on the same `X`, only `Xty` and `yty` need to be recomputed; the costly $X'X$ is reused: ```{r} y2_centered <- Y[,2] - mean(Y[,2]) ss2 <- ss ss2$Xty <- drop(y2_centered %*% X) ss2$yty <- sum(y2_centered^2) ss2$y_mean <- mean(Y[,2]) fitted_ss2 <- susie_ss(XtX = ss2$XtX, Xty = ss2$Xty, yty = ss2$yty, n = ss2$n, X_colmeans = ss2$X_colmeans, y_mean = ss2$y_mean, L = 10) ``` `susie()` emits a hint suggesting this workflow whenever `nrow(X) >= 2 * ncol(X)`. ## Session information Here are some details about the computing environment, including the versions of R, and the R packages, used to generate these results. 
```{r} sessionInfo() ``` [N3finemapping]: https://github.com/stephenslab/susieR/blob/master/data/N3finemapping.RData ================================================ FILE: vignettes/finemapping_summary_statistics.Rmd ================================================ --- title: "Fine-mapping with summary statistics" author: "Yuxin Zou and Gao Wang" date: "`r Sys.Date()`" output: rmarkdown::html_vignette vignette: > %\VignetteIndexEntry{Fine-mapping with summary statistics} %\VignetteEngine{knitr::rmarkdown} %\VignetteEncoding{UTF-8} --- ```{r setup, include=FALSE} knitr::opts_chunk$set(collapse = TRUE,comment = "#",fig.width = 5, fig.height = 3,fig.align = "center", fig.cap = " ",dpi = 120) ``` This vignette demonstrates how to use `susieR` with "summary statistics" in the context of genetic fine-mapping. We use the same simulated data as in the [fine mapping vignette](finemapping.html). The simulated data are expression levels of a gene ($y$) in $N \approx 600$ individuals. We want to identify with the genotype matrix $X_{N\times P}$ ($P=1001$) the genetic variables that cause changes in expression level. This data set is shipped with `susieR`. It is simulated to have exactly three non-zero effects. ```{r} library(susieR) set.seed(1) ``` ## The data-set ```{r} data(N3finemapping) attach(N3finemapping) n = nrow(X) ``` Notice that we've simulated two sets of $Y$ as two simulation replicates. Here we'll focus on the first data-set. ```{r} dim(Y) ``` Here are the three true signals in the first data-set: ```{r} b <- true_coef[,1] plot(b, pch=16, ylab='effect size') ``` ```{r} which(b != 0) ``` So the underlying causal variables are 403, 653 and 773. ## Summary statistics from simple regression Summary statistics of genetic association studies typically contain effect sizes ($\hat{\beta}$ coefficient from regression) and p-values. These statistics can be used to perform fine-mapping given an additional input of the correlation matrix between variables. 
The correlation matrix in genetics is typically referred to as an "LD matrix" (LD is short for linkage disequilibrium). One may use external reference panels to estimate it when this matrix cannot be obtained from samples directly. *Importantly, the LD matrix has to be a matrix containing estimates of the correlation, $r$, and not $r^2$ or $|r|$.* See also [this vignette](susierss_diagnostic.html) for how to check the consistency of the LD matrix with the summary statistics. The `univariate_regression` function can be used to compute summary statistics by fitting univariate simple regression variable by variable. The results are $\hat{\beta}$ and $SE(\hat{\beta})$ from which z-scores can be derived. Alternatively, you can obtain z-scores from $\hat{\beta}$ and p-values if you are provided with that information. For example, ```{r} sumstats <- univariate_regression(X, Y[,1]) z_scores <- sumstats$betahat / sumstats$sebetahat susie_plot(z_scores, y = "z", b=b) ``` For this example, the correlation matrix can be computed directly from data provided: ```{r} R <- cor(X) ``` ## Fine-mapping with `susieR` using summary statistics By default, SuSiE assumes at most 10 causal variables, with `L = 10`, although we note that SuSiE is generally robust to the choice of `L`. Since the individual-level data is available for us here, we can easily compute the "in-sample LD" matrix, as well as the variance of $y$, which is `r round(var(Y[,1]),digits = 4)`. (By "in-sample", we mean the LD was computed from the exact same matrix `X` that was used to obtain the other statistics.) When we fit SuSiE regression with summary statistics, $\hat{\beta}$, $SE(\hat{\beta})$, $R$, $n$, and `var_y`; these are also the *sufficient statistics.* With an in-sample LD, we can also estimate the residual variance using these sufficient statistics. 
(Note that if the covariate effects are removed from the genotypes in the univariate regression, it is recommended that the "in-sample" LD matrix also be computed from the genotypes after the covariate effects have been removed.) ```{r} fitted_rss1 <- susie_rss(bhat = sumstats$betahat, shat = sumstats$sebetahat, n = n, R = R, var_y = var(Y[,1]), L = 10, estimate_residual_variance = TRUE) ``` Using `summary`, we can examine the posterior inclusion probability (PIP) for each variable, and the 95% credible sets: ```{r} summary(fitted_rss1)$cs ``` The three causal signals have been captured by the three CSs. Note the third CS contains many variables, including the true causal variable 403. We can also plot the posterior inclusion probabilities (PIPs): ```{r} susie_plot(fitted_rss1, y="PIP", b=b) ``` The true causal variables are shown in red. The 95% CSs are shown by three different colours (green, purple, blue). Note this result is *exactly the same* as running `susie` on the original individual-level data: ```{r} fitted = susie(X, Y[,1], L = 10) all.equal(fitted$pip, fitted_rss1$pip) all.equal(coef(fitted)[-1], coef(fitted_rss1)[-1]) ``` If, on the other hand, the variance of $y$ is unknown, we can fit SuSiE regression with summary statistics, $\hat{\beta}$, $SE(\hat{\beta})$, $R$ and $n$ (or *z*-scores, $R$ and $n$). The outputted effect estimates are now on the standardized $X$ and $y$ scale. 
Still, we can estimate the residual variance because we have the in-sample LD matrix: ```{r} fitted_rss2 = susie_rss(z = z_scores, R = R, n = n, L = 10, estimate_residual_variance = TRUE) ``` The result is same as if we had run `susie` on the individual-level data, but the output effect estimates are on different scale: ```{r, fig.height=4, fig.width=3.5} all.equal(fitted$pip, fitted_rss2$pip) plot(coef(fitted)[-1], coef(fitted_rss2)[-1], xlab = 'effects from SuSiE', ylab = 'effects from SuSiE-RSS', xlim=c(-1,1), ylim=c(-0.3,0.3)) ``` Specifically, without the variance of $y$, these estimates are same as if we had applied SuSiE to a standardized $X$ and $y$; that is, as if $y$ and the columns of $X$ had been normalized so that $y$ and each column of $X$ had a standard deviation of 1. ```{r} fitted_standardize = susie(scale(X), scale(Y[,1]), L = 10) all.equal(coef(fitted_standardize)[-1], coef(fitted_rss2)[-1]) ``` ## Fine-mapping with `susieR` using LD matrix from reference panel When the original genotypes are not available, one may use a separate reference panel to estimate the LD matrix. To illustrate this, we randomly generated 500 samples from $N(0,R)$ and treated them as reference panel genotype matrix `X_ref`. ```{r echo=F} set.seed(1) tmp = matrix(rnorm(500*1001), 500, 1001) eigenR = eigen(R) eigenR$values[eigenR$values < 1e-10] = 0 X_ref = tmp %*% (sqrt(eigenR$values) * t(eigenR$vectors)) R_ref = cor(X_ref) ``` We fit the SuSiE regression using out-of sample LD matrix. The residual variance is fixed at 1 because estimating residual variance sometimes produces very inaccurate estimates with out-of-sample LD matrix. The output effect estimates are on the standardized $X$ and $y$ scale. ```{r} fitted_rss3 <- susie_rss(z_scores, R_ref, n=n, L = 10) ``` ```{r} susie_plot(fitted_rss3, y="PIP", b=b) ``` In this particular example, the SuSiE result with out-of-sample LD is very similar to using the in-sample LD matrix because the LD matrices are quite similar. 
```{r, fig.width=3.5,fig.height=4} plot(fitted_rss1$pip, fitted_rss3$pip, ylim=c(0,1), xlab='SuSiE PIP', ylab='SuSiE-RSS PIP') ``` In some rare cases, the sample size $n$ is unknown. When the sample size is not provided as input to `susie_rss`, this is in effect assuming the sample size is infinity and all the effects are small, and the estimated PVE for each variant will be close to zero. The outputted effect estimates are on the "noncentrality parameter" scale. ```{r} fitted_rss4 = susie_rss(z_scores, R_ref, L = 10) susie_plot(fitted_rss4, y="PIP", b=b) ``` ## Session information Here are some details about the computing environment, including the versions of R, and the R packages, used to generate these results. ```{r} sessionInfo() ``` ================================================ FILE: vignettes/l0_initialization.Rmd ================================================ --- title: "SuSiE with L0Learn initialization example" author: "Kaiqian Zhang" date: "`r Sys.Date()`" output: rmarkdown::html_vignette vignette: > %\VignetteIndexEntry{SuSiE with L0Learn initialization example} %\VignetteEngine{knitr::rmarkdown} %\VignetteEncoding{UTF-8} --- ```{r setup, include=FALSE} knitr::opts_chunk$set(collapse = TRUE,comment = "#") ``` `susieR` allows for a customized initialization. In this vignette we demonstrate how to use an [`L0Learn`](https://github.com/hazimehh/L0Learn) fit to initialize `susieR`. ```{r, warning=FALSE} library(susieR) library(L0Learn) ``` ## Simulate data First, we simulate data from the minimal example. ```{r} set.seed(1) n = 1000 p = 1000 beta = rep(0,p) beta[c(1,2,300,400)] = 1 X = matrix(rnorm(n*p),nrow=n,ncol=p) y = X %*% beta + rnorm(n) ``` ## Fit L0Learn We start with fitting an L0-regularized model to the simulated data. ```{r} set.seed(1) L0fit = L0Learn.cvfit(X, y, penalty = "L0") ``` Let's choose the penalty strength parameter that minimizes the cross-validation error. 
```{r} lambdaIndex = which.min(L0fit$cvMeans[[1]]) L0coef = as.numeric(coef(L0fit$fit, lambda = L0fit$fit$lambda[[1]][lambdaIndex])) effect.beta = L0coef[which(L0coef!=0)][-1] effect.index = (which(L0coef!=0)-1)[-1] length(effect.beta) effect.beta[1:10] effect.index[1:10] ``` The L0Learn model finds `r length(effect.beta)` effects, which will be used to initialize susie. ## Build an initialization object We create an initialization from `l0learn` coefficients using `susie_init_coef` function, ```{r} set.seed(1) s.init = susie_init_coef(effect.index, effect.beta, p) ``` ## Run susieR with initialization Now, we use `effect.index` and `effect.beta` obtained from L0Learn fit to create an `s.init` object. We then run susie with this initialization. ```{r} susieL0.fit = susie(X,y,model_init=s.init) susieL0.fit$sets$cs ``` ## References 1. Hussein Hazimeh and Rahul Mazumder. (2018). Fast Best Subset Selection: Coordinate Descent and Local Combinatorial Optimization Algorithms. ================================================ FILE: vignettes/mwe.Rmd ================================================ --- title: "A minimal example" author: "Matthew Stephens" date: "`r Sys.Date()`" output: rmarkdown::html_vignette vignette: > %\VignetteIndexEntry{minimal example} %\VignetteEngine{knitr::rmarkdown} %\VignetteEncoding{UTF-8} --- ```{r setup, include=FALSE} knitr::opts_chunk$set(collapse = TRUE,comment = "#",fig.width = 4.5, fig.height = 3,fig.align = "center", fig.cap = " ",dpi = 120) ``` In this short vignette, we fit a sparse linear regression model with up to $L > 0$ non-zero effects. Generally, there is no harm in over-stating $L$ (that is, the method is pretty robust to overfitting), except that computation will grow as $L$ grows. 
Here is a minimal example: ```{r} library(susieR) set.seed(1) n <- 1000 p <- 1000 beta <- rep(0,p) beta[c(1,2,300,400)] <- 1 X <- matrix(rnorm(n*p),nrow=n,ncol=p) y <- X %*% beta + rnorm(n) res <- susie(X,y,L=10) plot(coef(res)[-1],pch = 20) ``` Plot the ground-truth outcomes vs. the predicted outcomes: ```{r fig.height=3.5, fig.width=3.5} plot(y,predict(res),pch = 20) ``` ## Session information Here are some details about the computing environment, including the versions of R, and the R packages, used to generate these results. ```{r} sessionInfo() ``` ================================================ FILE: vignettes/small_sample.Rmd ================================================ --- title: Accounting for uncertainty in residual variances for small sample studies author: William R.P. Denault date: "`r Sys.Date()`" output: rmarkdown::html_vignette vignette: > %\VignetteIndexEntry{Small data example} %\VignetteEngine{knitr::rmarkdown} %\VignetteEncoding{UTF-8} --- ```{r knitr-opts, include=FALSE} knitr::opts_chunk$set( comment = "#", collapse = TRUE, results = "markup", fig.align = "center", fig.width = 4.5, fig.height = 3.2, warning = FALSE, message = FALSE ) ``` This is vignette is a modified example based on Figure 1 panel B-C-D in [Denault et al paper](https://doi.org/10.1101/2025.05.16.654543). ```{r load-pkgs} library(susieR) ``` For reproducibility, set the seed: ```{r} set.seed(1) ``` ## Data In this example, we analyze a simulated eQTL data set. The goal is to finemap causal variants for expression (eQTLs). ```{r load-data} data(data_small) y <- data_small$y X <- data_small$X dim(X) ``` ## Baseline SuSiE fit The original SuSiE method displays signs of misscalibration: the result is highly suspicious as we find 10 credible sets in a data set containing only 47 samples. 
```{r run-susie, fig.height=3.5, fig.width=5, message=FALSE} res_susie <- susie(X,y,L = 10,verbose = TRUE) res_susie$sets$cs susie_plot(res_susie,y = "PIP") ``` Another clue is that the fine-mapped SNPs explain >99% of the variation in gene expression, which might be explained by overfitting: ```{r, fig.height=4.5, fig.width=4} ypred <- predict(res_susie, X) pve <- 1 - drop(res_susie$sigma2 / var(y)) round(100 * pve, 3) plot(y, ypred, pch = 20, xlab = "observed", ylab = "predicted") abline(0, 1, col = "magenta", lty = "dotted") ``` ## SuSiE with Servin-Stephens SER Setting `estimate_residual_method = "NIG"` switches SuSiE to a variant of the single-effect regression (SER) model that accounts for uncertainty in the residual variance. This is based on the linear regression model for single-SNP association tests described in [Servin and Stephens (2007)](https://doi.org/10.1371/journal.pgen.0030114). ```{r run-susie-small, message=FALSE, warning=FALSE} res_susie_small <- susie(X,y,L = 1,estimate_residual_method = "NIG", verbose = TRUE) res_susie_small$sets$cs ``` This analysis looks more plausible as it identifies only 1 CS: ```{r, fig.height=3, fig.width=5} susie_plot(res_susie_small,y = "PIP") ``` And, indeed, the predictions with the Servin-Stephens SER do not seem to "overfit" the expression data quite so strongly. ```{r, fig.height=4.5, fig.width=4} pred_small <- predict(res_susie_small, X) plot(y, ypred, pch = 20,col = "darkblue", xlab = "observed", ylab = "predicted") points(y, pred_small, pch = 20, col = "darkorange") abline(0, 1, col = "magenta", lty = "dotted") legend("topleft", pch = c(20, 20), col = c("darkblue","darkorange"), legend = c("SuSiE (default Gaussian SER)", "SuSiE (Servin-Stephens SER)")) ``` ### References Servin, B. & Stephens, M. (2007). Imputation-based analysis of association studies: Candidate regions and quantitative traits. *PLoS Genetics*, 3(7): e114. Denault et al (2025). 
Accounting for uncertainty in residual variances improves calibration for fine-mapping with small sample sizes. *bioRxiv* doi:10.1101/2025.05.16.654543. ================================================ FILE: vignettes/sparse_susie_eval.Rmd ================================================ --- title: "Evaluation of sparse version of SuSiE" author: "Kaiqian Zhang" date: "`r Sys.Date()`" output: rmarkdown::html_vignette vignette: > %\VignetteIndexEntry{SuSiE with sparse matrix operations} %\VignetteEngine{knitr::rmarkdown} %\VignetteEncoding{UTF-8} --- ```{r setup, include=FALSE} knitr::opts_chunk$set(collapse = TRUE,comment = "#",fig.width = 4.5, fig.height = 3,fig.align = "center", fig.cap = " ",dpi = 120) ``` ## Set up environment ```{r, warning=FALSE} library(Matrix) library(susieR) set.seed(1) ``` ## Overview In this vignette, we provide line profiles for a revised version of SuSiE, which allows for a sparse matrix structure. We compare speed performance when the form of the matrix `X` is dense and sparse. In this minimal example, we observe that given a large sparse matrix, if it is in the dense form, the speed is around `40%` slower than that in a sparse form. ## Simulate data We randomly simulate a `n=1000` by `p=1000` dense matrix and a sparse matrix at sparsity $99\%$, i.e. $99\%$ of the entries are zeros. ```{r} create_sparsity_mat = function(sparsity, n, p) { nonzero <- round(n*p*(1-sparsity)) nonzero.idx <- sample(n*p, nonzero) mat <- numeric(n*p) mat[nonzero.idx] <- 1 mat <- matrix(mat, nrow=n, ncol=p) return(mat) } ``` ```{r} n <- 1000 p <- 1000 beta <- rep(0,p) beta[c(1,300,400,1000)] <- 10 X.dense <- create_sparsity_mat(0.99,n,p) X.sparse <- as(X.dense,"sparseMatrix") y <- c(X.dense %*% beta + rnorm(n)) ``` ## `X` in a dense form ```{r} susie.dense <- susie(X.dense,y) ``` ## `X` in a sparse form ```{r} susie.sparse <- susie(X.sparse,y) ``` ## Further step We encourage people who are interested in improving SuSiE to get insights from the line profiles provided. 
================================================ FILE: vignettes/susie_refine.Rmd ================================================ --- title: "Refine SuSiE model" author: "Yuxin Zou" date: "`r Sys.Date()`" output: rmarkdown::html_vignette vignette: > %\VignetteIndexEntry{Refine SuSiE model} %\VignetteEngine{knitr::rmarkdown} %\VignetteEncoding{UTF-8} --- ```{r setup, include=FALSE} knitr::opts_chunk$set(collapse = TRUE,comment = "#",fig.width = 5, fig.height = 3,fig.align = "center", fig.cap = " ",dpi = 120) ``` In this vignette, we demonstrate a procedure that helps SuSiE get out of a local optimum. We simulate a phenotype using UK Biobank genotypes from 50,000 individuals. There are 1001 SNPs. It is simulated to have exactly 2 non-zero effects at 234, 287. ```{r} library(susieR) library(curl) data_file <- tempfile(fileext = ".RData") data_url <- paste0("https://raw.githubusercontent.com/stephenslab/susieR/", "master/inst/datafiles/FinemappingConvergence1k.RData") curl_download(data_url,data_file) load(data_file) b <- FinemappingConvergence$true_coef susie_plot(FinemappingConvergence$z, y = "z", b=b) ``` The strongest marginal association is a non-effect SNP. Since the sample size is large, we use sufficient statistics ($X^\intercal X, X^\intercal y, y^\intercal y$ and sample size $n$) to fit the susie model. It identifies 2 Credible Sets, one of which is a false positive. This is because `susieR` gets stuck at a local optimum. ```{r} fitted <- with(FinemappingConvergence, susie_ss(XtX = XtX, Xty = Xty, yty = yty, n = n)) susie_plot(fitted, y="PIP", b=b, main=paste0("ELBO = ", round(susie_get_objective(fitted),2))) ``` Our refine procedure to get out of a local optimum is 1. fit a susie model, $s$ (suppose it has $K$ CSs). 2. for CS in $s$, set SNPs in CS to have prior weight 0, fit susie model --> we have $K$ susie models: $t_1, \cdots, t_K$. 3. for each $k = 1, \cdots, K$, fit susie with initialization at $t_k$ ($\alpha, \mu, \mu^2$) --> $s_k$ 4. 
if $\max_k \text{elbo}(s_k) > \text{elbo}(s)$, set $s = s_{kmax}$ where $kmax = \arg_k \max \text{elbo}(s_k)$ and go to step 2; if no, break. We fit susie model with above procedure by setting `refine = TRUE`. ```{r} fitted_refine <- with(FinemappingConvergence, susie_ss(XtX = XtX, Xty = Xty, yty = yty, n = n, refine=TRUE)) susie_plot(fitted_refine, y="PIP", b=b, main=paste0("ELBO = ", round(susie_get_objective(fitted_refine),2))) ``` With the refine procedure, it identifies 2 CSs with the true signals, and the achieved evidence lower bound (ELBO) is higher. ## Session information Here are some details about the computing environment, including the versions of R, and the R packages, used to generate these results. ```{r} sessionInfo() ``` ================================================ FILE: vignettes/susie_rss.Rmd ================================================ --- title: "Compare susie_rss variants" author: "Peter Carbonetto" date: "`r Sys.Date()`" output: rmarkdown::html_vignette vignette: > %\VignetteIndexEntry{Compare susie_rss variants} %\VignetteEngine{knitr::rmarkdown} %\VignetteEncoding{UTF-8} --- In this vignette, we briefly illustrate the different ways [susie_rss][susie_rss] can be called, and draw connections between running `susie_rss` on summary data, and running `susie` on individual-level data. ```{r setup, include=FALSE} knitr::opts_chunk$set(collapse = TRUE,comment = "#",fig.width = 5, fig.height = 3,fig.align = "center", dpi = 120) ``` ```{r load-pkgs} library(susieR) ``` Simulate a data set with 200 samples and 1,000 variables, in which the only first 4 variables affect the outcome. ```{r simdata} set.seed(1) n <- 200 p <- 1000 beta <- rep(0,p) beta[1:4] <- 1 X <- matrix(rnorm(n*p),nrow = n,ncol = p) X <- scale(X,center = TRUE,scale = FALSE) y <- drop(X %*% beta + rnorm(n)) ``` Compute summary statistics $\hat{b}_j, \hat{s}_j$ and the correlation matrix, ${\bf R}$. These quantities will be provided as input to susie_rss. 
```{r sumstats-no-standardize} ss <- univariate_regression(X,y) dat <- compute_suff_stat(X,y,standardize = FALSE) R <- cov2cor(dat$XtX) ``` The susie and susie_rss analyses produce the exact same results when the summary statistics `bhat`, `shat`, `var_y` and `n` are provided to susie_rss (and when `R` is an "in sample" correlation estimate---that is, when it was computed from the same matrix `X` that was used to obtain the other statistics). If the covariate effects are removed from the genotypes in univariate regression, the in-sample LD matrix should be computed from the genotype residuals where the covariate effects have been removed. ```{r first-comparison, fig.height=3.5, fig.width=3} res1 <- susie(X,y,L = 10) res2 <- susie_rss(bhat = ss$betahat,shat = ss$sebetahat,R = R,n = n, var_y = var(y),L = 10,estimate_residual_variance = TRUE) plot(coef(res1),coef(res2),pch = 20,xlab = "susie",ylab = "susie_rss") abline(a = 0,b = 1,col = "skyblue",lty = "dashed") ``` When some but not all of these statistics are provided, the results should be similar, but not exactly the same. Next let's compare the susie and susie_rss outputs when ${\bf X}, y$ are *standardized* before computing the summary statistics (by "standardize", we mean that $y$ and the columns of ${\bf X}$ are each divided by the sample standard deviation so that they each have the same standard deviation). 
```{r sumstats-standardize-1} ss <- univariate_regression(scale(X),scale(y)) dat <- compute_suff_stat(X,y,standardize = TRUE) R <- cov2cor(dat$XtX) ``` Then we compute the *z*-scores: ```{r sumstats-standardize-2} zhat <- ss$betahat/ss$sebetahat ``` When standardizing, providing susie_rss with summary data `z` (or `bhat`, `shat`), `R` and `n` is sufficient for susie_rss to recover the same results as susie: ```{r second-comparison, fig.height=3.5, fig.width=6, message=FALSE} res1 <- susie(scale(X),scale(y),L = 10) res2 <- susie_rss(bhat = ss$betahat,shat = ss$sebetahat,R = R,n = n, L = 10,estimate_residual_variance = TRUE) res3 <- susie_rss(zhat,R,n = n,L = 10,estimate_residual_variance = TRUE) layout(matrix(1:2,1,2)) plot(coef(res1),coef(res2),pch = 20,xlab = "susie", ylab = "susie_rss(bhat,shat)") abline(a = 0,b = 1,col = "skyblue",lty = "dashed") plot(coef(res1),coef(res3),pch = 20,xlab = "susie",ylab = "susie_rss(z)") abline(a = 0,b = 1,col = "skyblue",lty = "dashed") ``` When the residual variance is not estimated in susie_rss, the susie_rss results may be close to susie, but may no longer be exactly the same: ```{r third-comparison, fig.height=3.5, fig.width=3, message=FALSE} res4 <- susie_rss(zhat,R,n = n,L = 10) plot(coef(res1),coef(res4),pch = 20,xlab = "susie",ylab = "susie_rss") abline(a = 0,b = 1,col = "skyblue",lty = "dashed") ``` Whenever `R` is an "in sample" correlation matrix, we recommend estimating the residual variance. 
Without providing the sample size, `n`, the coefficients are interpreted as the "noncentrality parameters" (NCPs), and are (roughly) related to the susie parameters by a factor of $\sqrt{n}$: ```{r fourth-comparison, fig.height=3.5, fig.width=3, message=FALSE, warning=FALSE} res5 <- susie_rss(zhat,R,L = 10) plot(coef(res1),coef(res5)/sqrt(n),pch = 20,xlab = "susie", ylab = "susie_rss/sqrt(n)") abline(a = 0,b = 1,col = "skyblue",lty = "dashed") ``` Whenever possible, the sample size, or a reasonable estimate of the sample size, should be provided. [susie_rss]: https://stephenslab.github.io/susieR/reference/susie_rss.html ================================================ FILE: vignettes/susie_unmappable_effects.Rmd ================================================ --- title: "Fine-mapping with SuSiE-ash and SuSiE-inf" author: "Alex McCreight" date: "`r Sys.Date()`" output: rmarkdown::html_vignette vignette: > %\VignetteIndexEntry{Fine-mapping with SuSiE-ash and SuSiE-inf} %\VignetteEngine{knitr::rmarkdown} %\VignetteEncoding{UTF-8} --- ```{r setup, include=FALSE} knitr::opts_chunk$set(collapse = TRUE,comment = "#",fig.width = 5, fig.height = 3,fig.align = "center", dpi = 120) ``` This vignette demonstrates how to use the SuSiE-ash and SuSiE-inf models. We use a simulated data set with n = 1000 individuals, p = 5000 variants, and a complex genetic architecture combining 3 sparse, 5 oligogenic, and 15 polygenic effects. ## Data ```{r} library(susieR) data(unmappable_data) X <- unmappable_data$X y <- as.vector(unmappable_data$y) b <- unmappable_data$beta plot(abs(b), ylab = "Absolute Effect Size", pch = 16) points(which(b != 0), abs(b[b != 0]), col = 2, pch = 16) ``` ## Summary Statistics and Z-Scores Before fitting the models, we can examine the marginal association statistics. 
We use `univariate_regression()` to compute effect sizes and standard errors, then derive z-scores: ```{r} sumstats <- univariate_regression(X, y) z_scores <- sumstats$betahat / sumstats$sebetahat ``` The z-scores show the strength of marginal association for each variant. Red points indicate non-zero effect sizes: ```{r} susie_plot(z_scores, y = "z", b = b, add_legend = TRUE) ``` Here we can see the signal landscape before fine-mapping. Note that some causal variants have strong z-scores while others may be weaker or masked by LD with nearby variants. Notably, variant 2714 has the largest true effect size in the simulation: ```{r} strongest_idx <- which.max(abs(b)) cat("Strongest effect variant:", strongest_idx, "\n") cat("True effect size:", round(b[strongest_idx], 3), "\n") cat("Marginal z-score:", round(z_scores[strongest_idx], 3), "\n") cat("Marginal p-value:", format.pval(2 * pnorm(-abs(z_scores[strongest_idx]))), "\n") ``` Despite having the largest true effect, this variant has a very small marginal z-score and a large p-value. This illustrates a fundamental challenge in fine-mapping: the marginal association of a large-effect causal variant can be masked by other variants in LD, while smaller-effect variants may show stronger marginal signals. This masking makes it difficult to identify the true causal variants from marginal statistics alone. ## Step 1: Standard SuSiE and False Positives We first fit standard SuSiE: ```{r} t0 <- proc.time() fit_susie <- susie(X, y, L = 10) t1 <- proc.time() t1 - t0 susie_plot(fit_susie, y = "PIP", b = b, main = "SuSiE (standard)", add_legend = TRUE) ``` We set `L = 10` to allow SuSiE to capture up to 10 sparse effects. However, given the complex architecture with 23 true causal variants, this may be insufficient. 
To see which true effects the credible sets capture, we plot the CS on the true effect sizes: ```{r} plot_cs_effects <- function(fit, b, main = "") { colors <- c("dodgerblue2", "green4", "#6A3D9A", "#FF7F00", "gold1", "firebrick2") plot(abs(b), pch = 16, ylab = "Absolute Effect Size", main = main) if (!is.null(fit$sets$cs)) { for (i in rev(seq_along(fit$sets$cs))) { cs_idx <- fit$sets$cs[[i]] points(cs_idx, abs(b[cs_idx]), col = colors[(i-1) %% 6 + 1], pch = 16, cex = 1.5) } } cat(sprintf("True causals: %s\n", paste(which(b != 0), collapse=", "))) for (i in seq_along(fit$sets$cs)) { cs_idx <- fit$sets$cs[[i]] sentinel <- cs_idx[which.max(fit$pip[cs_idx])] tp <- any(b[cs_idx] != 0) cat(sprintf(" CS%d: %d %s\n", i, sentinel, ifelse(tp, "TP", "FP"))) } } plot_cs_effects(fit_susie, b, main = "SuSiE CS on true effects") ``` SuSiE identifies 5 credible sets, but examining them more closely reveals a problem. Many of these credible sets appear to be false positives arising from synthetic associations. A synthetic association occurs when a non-causal variant shows an association with the phenotype because it is in LD with true causal variants. The non-causal variant "borrows" signal from correlated effect variants, and when it is correlated with multiple effect variants, these contributions can accumulate to create an inflated signal. 
Let's examine one of the false positive credible sets to see this in action: ```{r} nonzero_idx <- which(b != 0) fp_cs <- fit_susie$sets$cs[["L4"]] top_var <- fp_cs[which.max(fit_susie$pip[fp_cs])] cat("False positive CS top variant:", top_var, "\n") cat("True effect (beta):", b[top_var], "\n") cat("Z-score:", round(z_scores[top_var], 2), "\n\n") cat("LD with true effect variants and their contributions:\n") contributions <- data.frame( variant = nonzero_idx, r = round(sapply(nonzero_idx, function(v) cor(X[, top_var], X[, v])), 2), beta = round(b[nonzero_idx], 2) ) contributions$r_times_beta <- round(contributions$r * contributions$beta, 2) contributions <- contributions[order(-abs(contributions$r_times_beta)), ] print(head(contributions[abs(contributions$r) > 0.1, ], 6), row.names = FALSE) ``` Variant `r top_var` has **no true effect** (beta = 0), yet it has a z-score of `r round(z_scores[top_var], 2)`. This synthetic signal arises because it is correlated with multiple effect variants. Notice that: - It has **negative LD** with negative-effect variants (2714, 2939, 2943), giving **positive** contributions - It has **positive LD** with a positive-effect variant (2903), also giving a **positive** contribution These contributions accumulate to create a synthetic signal at the non-causal variant, which SuSiE then incorrectly identifies as a distinct effect. The other false positive credible sets arise from the same artifact. ## Step 2: Increasing Purity to Reduce False Positives One approach to reduce false positives is to increase the purity threshold. By default, SuSiE uses `min_abs_corr = 0.5`. Let's try `min_abs_corr = 0.8`: ```{r} cs_pure <- susie_get_cs(fit_susie, X = X, min_abs_corr = 0.8) cat("Number of CSs with purity >= 0.8:", length(cs_pure$cs), "\n") ``` Raising the purity threshold removes some false positives, but not all of them. 
Some false positive credible sets have high purity because the non-causal variants within them are highly correlated with each other. These sets pass the purity filter yet still fail to contain any true causal variants. ## Step 3: Fitting SuSiE-inf SuSiE-inf models an infinitesimal component to account for unmappable effects: ```{r} t0 <- proc.time() fit_inf <- susie(X, y, L = 10, unmappable_effects = "inf") t1 <- proc.time() t1 - t0 susie_plot(fit_inf, y = "PIP", b = b, main = "SuSiE-inf", add_legend = TRUE) ``` (Note that it may take several minutes to fit the SuSiE-Inf model.) ```{r} plot_cs_effects(fit_inf, b, main = "SuSiE-inf CS on true effects") ``` SuSiE-inf is more conservative and finds only 1 credible set, eliminating the false positives. However, it also loses the true signal around position 3500 that standard SuSiE correctly identified. Remarkably, SuSiE-inf identifies the variant with the strongest true effect, the same variant we noted earlier as having a very small marginal z-score and large p-value: ```{r} if (length(fit_inf$sets$cs) > 0) { inf_cs <- fit_inf$sets$cs[[1]] cat("SuSiE-inf CS contains variant", strongest_idx, ":", strongest_idx %in% inf_cs, "\n") cat("This variant has the largest true effect (beta =", round(b[strongest_idx], 3), ") but marginal z-score of only", round(z_scores[strongest_idx], 3), "\n") } ``` This is striking, as SuSiE-inf recovers the strongest causal signal that is completely invisible in marginal statistics. The intuition is that by modeling background polygenic effects, SuSiE-inf effectively conditions on other variants, revealing signals that are otherwise masked. 
However, for other signals, even if we lower the coverage threshold, we cannot recover them, potentially because SuSiE-inf was too aggressive removing them early-on in the SuSiE fit: ```{r} for (cov in c(0.9, 0.8, 0.7, 0.5)) { cs <- susie_get_cs(fit_inf, X = X, coverage = cov) cat(sprintf("Coverage=%.1f: %d credible sets\n", cov, length(cs$cs))) } ``` ## Step 4: SuSiE-ash Achieves the Middle Ground SuSiE-ash uses adaptive shrinkage to model the unmappable effects, providing a middle ground between standard SuSiE and SuSiE-inf: ```{r} t0 <- proc.time() fit_ash <- susie(X, y, L = 10, unmappable_effects = "ash", verbose = TRUE) t1 <- proc.time() t1 - t0 susie_plot(fit_ash, y = "PIP", b = b, main = "SuSiE-ash", add_legend = TRUE) ``` (Note that it may take several minutes to fit the SuSiE-ash model.) ```{r} plot_cs_effects(fit_ash, b, main = "SuSiE-ash CS on true effects") ``` SuSiE-ash finds 3 correct credible sets. Still, it does not discover all 23 causal variants, nor does it recover the strongest effect (variant 2714) that SuSiE-inf found. However, the adaptive shrinkage approach allows SuSiE-ash to distinguish between true sparse signals and the polygenic background more effectively than either standard SuSiE or SuSiE-inf alone. SuSiE-ash can also be used with summary statistics via `susie_ss()`, using `mr.ash.rss` as the backend for the adaptive shrinkage component. This enables fine-mapping with unmappable effects when only sufficient statistics (X'X, X'y, y'y) are available. 
```{r} XtX <- crossprod(X) Xty <- crossprod(X, y) yty <- sum(y^2) n <- nrow(X) t0 <- proc.time() fit_ash_ss <- susie_ss(XtX = XtX, Xty = Xty, yty = yty, n = n, L = 10, unmappable_effects = "ash", verbose = TRUE) t1 <- proc.time() t1 - t0 susie_plot(fit_ash_ss, y = "PIP", b = b, main = "SuSiE-ash (SS)", add_legend = TRUE) ``` ```{r} plot_cs_effects(fit_ash_ss, b, main = "SuSiE-ash (SS) CS on true effects") ``` We can verify the agreement between the two approaches: ```{r} pip_ind <- susie_get_pip(fit_ash) pip_ss <- susie_get_pip(fit_ash_ss) cat("Max |PIP difference|:", max(abs(pip_ind - pip_ss)), "\n") cat("PIP correlation:", cor(pip_ind, pip_ss), "\n") cat("Max |theta difference|:", max(abs(fit_ash$theta - fit_ash_ss$theta)), "\n") ``` When only GWAS summary statistics are available, `susie_rss()` can be used. For best agreement with individual-level analysis, we recommend providing effect sizes (`bhat`), standard errors (`shat`), and the phenotypic variance (`var_y`) along with the in-sample LD matrix (`R`) and sample size (`n`). 
This preserves the original data scale, allowing the adaptive shrinkage component to calibrate correctly: ```{r} R <- cor(X) bhat <- sumstats$betahat shat <- sumstats$sebetahat t0 <- proc.time() fit_ash_rss <- susie_rss(bhat = bhat, shat = shat, R = R, var_y = var(y), n = n, L = 10, unmappable_effects = "ash", estimate_residual_variance = TRUE, verbose = TRUE) t1 <- proc.time() t1 - t0 susie_plot(fit_ash_rss, y = "PIP", b = b, main = "SuSiE-ash (RSS)", add_legend = TRUE) ``` ```{r} plot_cs_effects(fit_ash_rss, b, main = "SuSiE-ash (RSS) CS on true effects") ``` With `bhat`, `shat`, `var_y`, and in-sample LD, `susie_rss` results match `susie_ss` closely: ```{r} pip_rss <- susie_get_pip(fit_ash_rss) cat("Max |PIP difference| (SS vs RSS):", max(abs(pip_ss - pip_rss)), "\n") cat("PIP correlation (SS vs RSS):", cor(pip_ss, pip_rss), "\n") ``` When only z-scores and an LD matrix are available (without `bhat`, `shat`, or `var_y`), `susie_rss` operates on a standardized scale where `var(y) = 1`. The credible sets are typically still correct, but the estimated `sigma2` will be on the standardized scale rather than the original scale. Note that when the LD matrix is not computed from the same sample as the summary statistics (out-of-sample LD), setting `estimate_residual_variance = FALSE` may be more appropriate to avoid bias from LD mismatch. ## Summary | Method | Credible Sets | False Positives | |--------|---------------|-----------------| | SuSiE (purity=0.5) | 5 | 4 | | SuSiE (purity=0.8) | 3 | 2 | | SuSiE-inf | 1 | 0 | | SuSiE-ash | 3 | 0 | | SuSiE-ash (SS) | 3 | 0 | | SuSiE-ash (RSS) | 3 | 0 | ## What if we increase L for standard SuSiE? Since the true simulation has 23 causal variants, one might ask: what if we simply increase `L` to give SuSiE more capacity? 
Let's try `L = 40`: ```{r} t0 <- proc.time() fit_susie_L40 <- susie(X, y, L = 40) t1 <- proc.time() t1 - t0 susie_plot(fit_susie_L40, y = "PIP", b = b, main = "SuSiE (L=40)", add_legend = TRUE) plot_cs_effects(fit_susie_L40, b, main = "SuSiE L=40 CS on true effects") ``` With `L = 40`, standard SuSiE does improve! Now it captures 4 CS with two of them true positives. However, it still produces false positives and takes considerably longer to converge. The rationale for SuSiE-ash is to avoid this concern: rather than specifying a large `L` to account for all potential effects, we use a reasonable `L` for sparse signals and let the adaptive shrinkage component absorb effects that cannot be mapped due to insufficiently specified `L`. This provides a more principled and computationally efficient approach. Naturally as a result, SuSiE-ash is more robust to the choice of `L` compared to SuSiE. For this example, setting `L` anywhere from 5 to 40 yields similar results, unlike standard SuSiE where performance varies substantially with `L`. (Readers can verify this on their own with this data-set) ## Session Information ```{r} sessionInfo() ``` ================================================ FILE: vignettes/susierss_diagnostic.Rmd ================================================ --- title: "Diagnostic for fine-mapping with summary statistics" author: "Yuxin Zou" date: "`r Sys.Date()`" output: rmarkdown::html_vignette vignette: > %\VignetteIndexEntry{Diagnostic for fine-mapping with summary statistics} %\VignetteEngine{knitr::rmarkdown} %\VignetteEncoding{UTF-8} --- ```{r setup, include=FALSE} knitr::opts_chunk$set(collapse = TRUE,comment = "#",fig.width = 5, fig.height = 3,fig.align = "center", fig.cap = " ",dpi = 120) ``` This vignette demonstrates the use of the diagnostic plot for assessing consistency of the summary statistics and the reference LD matrix. 
`susie_rss` assumes the LD matrix accurately estimates the correlations among SNPs from the original GWAS genotype data. Typically, the LD matrix comes from some public database of genotypes in a suitable reference population. Inaccurate LD information leads to unreliable fine-mapping results. The diagnostic for consistency between summary statistics and the reference LD matrix is based on the RSS model under the null with regularized LD matrix. $$ \hat{z} | R, \lambda \sim N(0, (1-\lambda)R + \lambda I), 0<\lambda<1 $$ The parameter $\lambda$ is estimated by maximum likelihood. A larger $\lambda$ means a greater inconsistency between summary statistics and the LD matrix. The expected z score is computed for each SNP, $E(\hat{z}_j | \hat{z}_{-j})$, and plotted against the observed z scores. ```{r} library(susieR) library(curl) ``` ## LD information from the original genotype data We demonstrate the diagnostic plot in a simple case in which the LD matrix is estimated from the original genotype data. In this case, we expect the diagnostic plot to confirm that the LD matrix is consistent with the z scores. We use the same simulated data as in the [fine-mapping vignette](finemapping.html). 
```{r} data("N3finemapping") n = nrow(N3finemapping$X) b = N3finemapping$true_coef[,1] sumstats <- univariate_regression(N3finemapping$X, N3finemapping$Y[,1]) z_scores <- sumstats$betahat / sumstats$sebetahat Rin = cor(N3finemapping$X) attr(Rin, "eigen") = eigen(Rin, symmetric = TRUE) susie_plot(z_scores, y = "z", b=b) ``` The estimated $\lambda$ is ```{r} lambda = estimate_s_rss(z_scores, Rin, n=n) lambda ``` The plot for the observed z scores vs the expected z scores is ```{r} condz_in = kriging_rss(z_scores, Rin, n=n) condz_in$plot ``` Summary of SuSiE Credible Sets: ```{r} fit <- susie_rss(z_scores, Rin, n=n, estimate_residual_variance = TRUE) susie_plot(fit,y = "PIP", b=b) ``` ## LD information from the reference panel We use another simulated data where the LD matrix is estimated from a reference panel. In this example data set, there is one association signal in the simulated data (red point), and there is one SNP with mismatched reference and alternative allele between summary statistics and the reference panel (yellow point). **Note:** In some versions of [PLINK][plink], these mismatches can occur when [PLINK automatically flips the alleles to make the minor allele be the effect allele](https://github.com/stephenslab/susieR/issues/148), leading to different allele encodings in the z scores and LD matrix. Adding the flag `--keep-allele-order` will disable this behaviour in PLINK. 
```{r} data_file <- tempfile(fileext = ".RData") data_url <- paste0("https://raw.githubusercontent.com/stephenslab/susieR/", "master/inst/datafiles/SummaryConsistency1k.RData") curl_download(data_url,data_file) load(data_file) zflip = SummaryConsistency$z ld = SummaryConsistency$ldref n=10000 b = numeric(length(zflip)) b[SummaryConsistency$signal_id] = zflip[SummaryConsistency$signal_id] plot(zflip, pch = 16, col = "#767676", main = "Marginal Associations", xlab="SNP", ylab = "z scores") points(SummaryConsistency$signal_id, zflip[SummaryConsistency$signal_id], col=2, pch=16) points(SummaryConsistency$flip_id, zflip[SummaryConsistency$flip_id], col=7, pch=16) ``` Using the data with misaligned allele, SuSiE-RSS identifies a true positive CS containing the true effect SNP; and a false positive CS that incorrectly contains the mismatched SNP. ```{r} fit = susie_rss(zflip, ld, n=n) susie_plot(fit, y='PIP', b=b) points(SummaryConsistency$flip_id, fit$pip[SummaryConsistency$flip_id], col=7, pch=16) ``` The estimated $\lambda$ is ```{r} lambda = estimate_s_rss(zflip, ld, n=n) lambda ``` In the diagnostic plot, the mismatched SNP shows the largest difference between observed and expected z-scores, and therefore appears furthest away from the diagonal. ```{r} condz = kriging_rss(zflip, ld, n=n) condz$plot ``` After fixing the allele encoding, SuSiE-RSS identifies a single true positive CS containing the true-effect SNP, and the formerly mismatched SNP is (correctly) not included in a CS. ```{r} z = zflip z[SummaryConsistency$flip_id] = -z[SummaryConsistency$flip_id] fit = susie_rss(z, ld, n=n) susie_plot(fit, y='PIP', b=b) ``` ## Session information Here are some details about the computing environment, including the versions of R, and the R packages, used to generate these results. 
```{r session-info} sessionInfo() ``` [plink]: https://www.cog-genomics.org/plink ================================================ FILE: vignettes/trend_filtering.Rmd ================================================ --- title: "Trend filtering" author: "Matthew Stephens" date: "`r Sys.Date()`" output: rmarkdown::html_vignette vignette: > %\VignetteIndexEntry{Trend filtering} %\VignetteEngine{knitr::rmarkdown} %\VignetteEncoding{UTF-8} --- ```{r setup, include=FALSE} knitr::opts_chunk$set(collapse = TRUE,comment = "#",fig.width = 4.5, fig.height = 3,fig.align = "center", fig.cap = " ",dpi = 120) ``` # Introduction Although we developed SuSiE primarily with the goal of performing variable selection in highly sparse settings -- and, in particular, for genetic fine-mapping -- the approach also has considerable potential for application to other large-scale regression problems. Here we briefly illustrate this potential by applying it to a non-parametric regression problem that at first sight seems to be ill-suited to our approach. In particular, it does not involve strict sparsity, and the underlying correlation structure of the explanatory variables is very different from the "blocky" covariance structure of genetic data that SuSiE was designed for. Nonetheless, we will see that SuSiE performs well here despite this (partly due to its ability to capture non-sparse signals via Bayesian Model Averaging). Specifically, consider the non-parametric regression: $$y_t = \mu_t + e_t \quad t=1,\dots,T$$ where the goal is to estimate the underlying mean, $\mu_t$, under the assumption that it varies smoothly (or, more precisely, in a spatially-structured way) with $t$. One very simple way to capture spatial structure in $\mu$ is to model it as a (sparse) linear combination of step functions: $$\mu = Xb$$ where the $j$th column of $X$ is the step function with a step at $j$ ($j = 1,\dots,(T-1)$); that is $x_{tj}=0$ for $t<=j$ and 1 for $t>j$. 
The $j$th element of $b$ therefore determines the change in the mean $|\mu_j-\mu_{j+1}|$, and an assumption that $b$ is sparse encapsulates an assumption that $\mu$ is spatially structured (indeed, piecewise constant). This very simple approach is essentially 0th-order trend filtering (Tibshirani, 2014, *Annals of Statistics* 42, 285--323). Note that higher-order trend filtering can be similarly implemented using different basis functions; here we use 0th order only for simplicity. # Examples Here we apply SuSiE to perform 0th order trend filtering in some simple simulated examples. We have implemented in `susieR` 0.6.0 a function `susie_trendfilter` which internally creates an $X$ matrix with step functions in the columns to match input $y$. The algebra has been optimized to work on such trendfiltering matrices. Here we simulate some data where $\mu$ is a step function with four steps, a 0th order trendfiltering problem. The regression is truly sparse and SuSiE should do well. ```{r} library(susieR) set.seed(1) n=1000 mu = c(rep(0,100),rep(1,100),rep(3,100),rep(-2,100),rep(0,600)) y = mu + rnorm(n) s = susie_trendfilter(y, 0, L=10) ``` Plot results: the truth is black, and the susie estimate is red. ```{r} plot(y,pch=".") lines(mu,col=1,lwd=3) lines(predict(s),col=2,lwd=2) s$sigma2 ``` In the next example, $\mu$ increases linearly. Thus we are approximating a linear function by step functions. Here the truth is not truly "sparse", so we might expect performance to be poor, but it is not too bad. ```{r} set.seed(1) mu = seq(0,4,length=1000) y = mu + rnorm(n) s = susie_trendfilter(y,0,L=10) plot(y,pch=".") lines(mu,col=1,lwd=3) lines(predict(s),col=2,lwd=2) ``` Compare with the genlasso (lasso-based) solution (blue). (This will require installation of the `genlasso` package, which is not available on CRAN, but can be installed from GitHub.) 
```{r, eval=FALSE} # install.packages("remotes") # remotes::install_github("glmgen/genlasso") y.tf = trendfilter(y,ord=0) y.tf.cv = cv.trendfilter(y.tf) plot(y,pch=".") lines(mu,col=1,lwd=3) lines(predict(s),col=2,lwd=2) lines(y.tf$fit[,which(y.tf$lambda==y.tf.cv$lambda.min)],col=4,lwd=2) ``` What happens if we have linear trend plus a sudden change. ```{r, eval=FALSE} set.seed(1) mu = seq(0,4,length=1000) mu = mu + c(rep(0,500),rep(4,500)) y = mu + rnorm(n) s = susie_trendfilter(y,0,L=10) y.tf = trendfilter(y,ord=0) y.tf.cv = cv.trendfilter(y.tf) plot(y,pch=".") lines(mu,col=1,lwd=3) lines(predict(s),col=2,lwd=2) lines(y.tf$fit[,which(y.tf$lambda==y.tf.cv$lambda.min)],col=4,lwd=2) ``` The two fits seem similar in accuracy. We can check this numerically: ```{r, eval=FALSE} sqrt(mean((mu-y.tf$fit[,which(y.tf$lambda==y.tf.cv$lambda.min)])^2)) sqrt(mean((mu-predict(s))^2)) ```